diff --git a/.clang-format b/.clang-format
index 2da3911dced..893d9c613f1 100644
--- a/.clang-format
+++ b/.clang-format
@@ -74,6 +74,7 @@ ConstructorInitializerIndentWidth: 4
ContinuationIndentWidth: 4
DerivePointerAlignment: false
DisableFormat: false
+IndentRequiresClause: false
IndentWidth: 4
IndentWrappedFunctionNames: false
MacroBlockBegin: ''
diff --git a/.github/workflows/nightly.yml b/.github/workflows/nightly.yml
index acf6bbe8f6a..cf61012f2bc 100644
--- a/.github/workflows/nightly.yml
+++ b/.github/workflows/nightly.yml
@@ -121,8 +121,6 @@ jobs:
docker ps --all --quiet | xargs --no-run-if-empty docker rm -f ||:
sudo rm -fr "$TEMP_PATH" "$CACHES_PATH"
SonarCloud:
- # TODO: Remove if: whenever SonarCloud supports c++23
- if: ${{ false }}
runs-on: [self-hosted, builder]
env:
SONAR_SCANNER_VERSION: 4.8.0.2856
@@ -159,7 +157,7 @@ jobs:
- name: Set Up Build Tools
run: |
sudo apt-get update
- sudo apt-get install -yq git cmake ccache ninja-build python3 yasm
+ sudo apt-get install -yq git cmake ccache ninja-build python3 yasm nasm
sudo bash -c "$(wget -O - https://apt.llvm.org/llvm.sh)"
- name: Run build-wrapper
run: |
@@ -178,4 +176,5 @@ jobs:
--define sonar.cfamily.build-wrapper-output="${{ env.BUILD_WRAPPER_OUT_DIR }}" \
--define sonar.projectKey="ClickHouse_ClickHouse" \
--define sonar.organization="clickhouse-java" \
- --define sonar.exclusions="**/*.java,**/*.ts,**/*.js,**/*.css,**/*.sql" \
+ --define sonar.cfamily.cpp23.enabled=true \
+ --define sonar.exclusions="**/*.java,**/*.ts,**/*.js,**/*.css,**/*.sql"
diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml
index 506ed451b6d..afc08f3e637 100644
--- a/.github/workflows/pull_request.yml
+++ b/.github/workflows/pull_request.yml
@@ -46,7 +46,12 @@ jobs:
- name: Python unit tests
run: |
cd "$GITHUB_WORKSPACE/tests/ci"
+ echo "Testing the main ci directory"
python3 -m unittest discover -s . -p '*_test.py'
+ for dir in *_lambda/; do
+ echo "Testing $dir"
+ python3 -m unittest discover -s "$dir" -p '*_test.py'
+ done
DockerHubPushAarch64:
needs: CheckLabels
runs-on: [self-hosted, style-checker-aarch64]
diff --git a/.github/workflows/woboq.yml b/.github/workflows/woboq.yml
index bdfbc8fef9c..1ef729af30a 100644
--- a/.github/workflows/woboq.yml
+++ b/.github/workflows/woboq.yml
@@ -12,6 +12,7 @@ jobs:
# don't use dockerhub push because this image updates so rarely
WoboqCodebrowser:
runs-on: [self-hosted, style-checker]
+ timeout-minutes: 420 # the task is pretty heavy, so there's an additional hour
steps:
- name: Set envs
run: |
diff --git a/.gitmodules b/.gitmodules
index 8bf4f6e8975..151dc28c55b 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -19,7 +19,7 @@
url = https://github.com/google/googletest
[submodule "contrib/capnproto"]
path = contrib/capnproto
- url = https://github.com/capnproto/capnproto
+ url = https://github.com/ClickHouse/capnproto
[submodule "contrib/double-conversion"]
path = contrib/double-conversion
url = https://github.com/google/double-conversion
diff --git a/.yamllint b/.yamllint
index fe161e71849..9d6550ac960 100644
--- a/.yamllint
+++ b/.yamllint
@@ -6,8 +6,10 @@ rules:
level: warning
indent-sequences: consistent
line-length:
- # there are some bash -c "", so this is OK
- max: 300
+ # there are:
+ # - bash -c "", so this is OK
+ # - yaml in tests
+ max: 1000
level: warning
comments:
min-spaces-from-content: 1
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 1ccd4f9846d..bf6b309ef2c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,4 +1,6 @@
### Table of Contents
+**[ClickHouse release v23.6, 2023-06-29](#236)**
+**[ClickHouse release v23.5, 2023-06-08](#235)**
**[ClickHouse release v23.4, 2023-04-26](#234)**
**[ClickHouse release v23.3 LTS, 2023-03-30](#233)**
**[ClickHouse release v23.2, 2023-02-23](#232)**
@@ -7,6 +9,358 @@
# 2023 Changelog
+### ClickHouse release 23.6, 2023-06-29
+
+#### Backward Incompatible Change
+* Delete feature `do_not_evict_index_and_mark_files` in the fs cache. This feature was only making things worse. [#51253](https://github.com/ClickHouse/ClickHouse/pull/51253) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Remove ALTER support for experimental LIVE VIEW. [#51287](https://github.com/ClickHouse/ClickHouse/pull/51287) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Decrease the default values for `http_max_field_value_size` and `http_max_field_name_size` to 128 KiB. [#51163](https://github.com/ClickHouse/ClickHouse/pull/51163) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* CGroups metrics related to CPU are replaced with one metric, `CGroupMaxCPU` for better usability. The `Normalized` CPU usage metrics will be normalized to CGroups limits instead of the total number of CPUs when they are set. This closes [#50836](https://github.com/ClickHouse/ClickHouse/issues/50836). [#50835](https://github.com/ClickHouse/ClickHouse/pull/50835) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### New Feature
+* The function `transform` as well as `CASE` with value matching started to support all data types. This closes [#29730](https://github.com/ClickHouse/ClickHouse/issues/29730). This closes [#32387](https://github.com/ClickHouse/ClickHouse/issues/32387). This closes [#50827](https://github.com/ClickHouse/ClickHouse/issues/50827). This closes [#31336](https://github.com/ClickHouse/ClickHouse/issues/31336). This closes [#40493](https://github.com/ClickHouse/ClickHouse/issues/40493). [#51351](https://github.com/ClickHouse/ClickHouse/pull/51351) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Added an option `--rename_files_after_processing`. This closes [#34207](https://github.com/ClickHouse/ClickHouse/issues/34207). [#49626](https://github.com/ClickHouse/ClickHouse/pull/49626) ([alekseygolub](https://github.com/alekseygolub)).
+* Add support for the `TRUNCATE` modifier in the `INTO OUTFILE` clause. Suggest using `APPEND` or `TRUNCATE` for `INTO OUTFILE` when the file already exists. [#50950](https://github.com/ClickHouse/ClickHouse/pull/50950) ([alekar](https://github.com/alekar)).
+* Add table engine `Redis` and table function `redis`. It allows querying external Redis servers. [#50150](https://github.com/ClickHouse/ClickHouse/pull/50150) ([JackyWoo](https://github.com/JackyWoo)).
+* Allow skipping empty files in the file/s3/url/hdfs table functions using settings `s3_skip_empty_files`, `hdfs_skip_empty_files`, `engine_file_skip_empty_files`, `engine_url_skip_empty_files`. [#50364](https://github.com/ClickHouse/ClickHouse/pull/50364) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add a new setting named `use_mysql_types_in_show_columns` to alter the `SHOW COLUMNS` SQL statement to display MySQL equivalent types when a client is connected via the MySQL compatibility port. [#49577](https://github.com/ClickHouse/ClickHouse/pull/49577) ([Thomas Panetti](https://github.com/tpanetti)).
+* clickhouse-client can now be called with a connection string instead of `--host`, `--port`, `--user`, etc. [#50689](https://github.com/ClickHouse/ClickHouse/pull/50689) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Add setting `session_timezone`; it is used as the default timezone for a session when not explicitly specified (see the example after this list). [#44149](https://github.com/ClickHouse/ClickHouse/pull/44149) ([Andrey Zvonov](https://github.com/zvonand)).
+* Codec DEFLATE_QPL is now controlled via server setting "enable_deflate_qpl_codec" (default: false) instead of setting "allow_experimental_codecs". This marks DEFLATE_QPL non-experimental. [#50775](https://github.com/ClickHouse/ClickHouse/pull/50775) ([Robert Schulze](https://github.com/rschu1ze)).
+
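+For example, the new `session_timezone` setting can be tried with a minimal, self-contained query (the chosen time zone name is only an illustration; any zone known to the server works):
+
+```sql
+-- DateTime values without an explicit time zone now default to the session time zone:
+SET session_timezone = 'Europe/Berlin';
+SELECT timeZone();  -- returns 'Europe/Berlin' instead of the server default
+```
+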
+#### Performance Improvement
+* Improved scheduling of merge selecting and cleanup tasks in `ReplicatedMergeTree`. The tasks will not be executed too frequently when there's nothing to merge or cleanup. Added settings `max_merge_selecting_sleep_ms`, `merge_selecting_sleep_slowdown_factor`, `max_cleanup_delay_period` and `cleanup_thread_preferred_points_per_iteration`. It should close [#31919](https://github.com/ClickHouse/ClickHouse/issues/31919). [#50107](https://github.com/ClickHouse/ClickHouse/pull/50107) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Allow filter push-down through cross join. [#50605](https://github.com/ClickHouse/ClickHouse/pull/50605) ([Han Fei](https://github.com/hanfei1991)).
+* Improve performance when QueryProfiler is enabled by using a thread-local `timer_id` instead of a global object. [#48778](https://github.com/ClickHouse/ClickHouse/pull/48778) ([Jiebin Sun](https://github.com/jiebinn)).
+* Rewrite the CapnProto input/output format to improve its performance. Match column names and CapnProto fields case-insensitively; fix reading/writing of nested structure fields. [#49752](https://github.com/ClickHouse/ClickHouse/pull/49752) ([Kruglov Pavel](https://github.com/Avogar)).
+* Optimize Parquet write performance for parallel threads. [#50102](https://github.com/ClickHouse/ClickHouse/pull/50102) ([Hongbin Ma](https://github.com/binmahone)).
+* Disable `parallelize_output_from_storages` for processing MATERIALIZED VIEWs and storages with one block only. [#50214](https://github.com/ClickHouse/ClickHouse/pull/50214) ([Azat Khuzhin](https://github.com/azat)).
+* Merge PR [#46558](https://github.com/ClickHouse/ClickHouse/pull/46558). Avoid block permutation during sort if the block is already sorted. [#50697](https://github.com/ClickHouse/ClickHouse/pull/50697) ([Alexey Milovidov](https://github.com/alexey-milovidov), [Maksim Kita](https://github.com/kitaisreal)).
+* Make multiple list requests to ZooKeeper in parallel to speed up reading from the `system.zookeeper` table (see the example after this list). [#51042](https://github.com/ClickHouse/ClickHouse/pull/51042) ([Alexander Gololobov](https://github.com/davenger)).
+* Speed up initialization of DateTime lookup tables for time zones. This should reduce the startup/connect time of clickhouse-client, especially in debug builds, as this initialization is rather heavy. [#51347](https://github.com/ClickHouse/ClickHouse/pull/51347) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix slowness in data lakes caused by synchronous HEAD requests (related to Iceberg/Deltalake/Hudi being slow with a lot of files). [#50976](https://github.com/ClickHouse/ClickHouse/pull/50976) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Do not read all the columns from the right table of a GLOBAL JOIN. [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+
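+A simple way to observe the parallel `system.zookeeper` listing mentioned above (the paths are illustrative; any existing ZooKeeper paths work):
+
+```sql
+-- Listing several subtrees in one query now issues the LIST requests in parallel:
+SELECT name, path
+FROM system.zookeeper
+WHERE path IN ('/clickhouse', '/clickhouse/tables');
+```
+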
+#### Experimental Feature
+* Support parallel replicas with the analyzer. [#50441](https://github.com/ClickHouse/ClickHouse/pull/50441) ([Raúl Marín](https://github.com/Algunenano)).
+* Add random sleep before large merges/mutations execution to split load more evenly between replicas in case of zero-copy replication. [#51282](https://github.com/ClickHouse/ClickHouse/pull/51282) ([alesapin](https://github.com/alesapin)).
+* Do not replicate `ALTER PARTITION` queries and mutations through `Replicated` database if it has only one shard and the underlying table is `ReplicatedMergeTree`. [#51049](https://github.com/ClickHouse/ClickHouse/pull/51049) ([Alexander Tokmakov](https://github.com/tavplubix)).
+
+#### Improvement
+* Relax the thresholds for "too many parts" to be more modern. Reinstate backpressure during long-running insert queries. [#50856](https://github.com/ClickHouse/ClickHouse/pull/50856) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Allow casting IPv6 to an IPv4 address for the CIDR ::ffff:0:0/96 (IPv4-mapped addresses). [#49759](https://github.com/ClickHouse/ClickHouse/pull/49759) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Update MongoDB protocol to support MongoDB 5.1 version and newer. Support for the versions with the old protocol (<3.6) is preserved. Closes [#45621](https://github.com/ClickHouse/ClickHouse/issues/45621), [#49879](https://github.com/ClickHouse/ClickHouse/issues/49879). [#50061](https://github.com/ClickHouse/ClickHouse/pull/50061) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Add setting `input_format_max_bytes_to_read_for_schema_inference` to limit the number of bytes to read in schema inference. Closes [#50577](https://github.com/ClickHouse/ClickHouse/issues/50577). [#50592](https://github.com/ClickHouse/ClickHouse/pull/50592) ([Kruglov Pavel](https://github.com/Avogar)).
+* Respect setting `input_format_null_as_default` in schema inference. [#50602](https://github.com/ClickHouse/ClickHouse/pull/50602) ([Kruglov Pavel](https://github.com/Avogar)).
+* Allow skipping trailing empty lines in the CSV/TSV/CustomSeparated formats via settings `input_format_csv_skip_trailing_empty_lines`, `input_format_tsv_skip_trailing_empty_lines` and `input_format_custom_skip_trailing_empty_lines` (disabled by default); see the sketch after this list. Closes [#49315](https://github.com/ClickHouse/ClickHouse/issues/49315). [#50635](https://github.com/ClickHouse/ClickHouse/pull/50635) ([Kruglov Pavel](https://github.com/Avogar)).
+* Functions `toDateOrDefault`/`toDateOrNull` and `accurateCast[OrDefault|OrNull]` now correctly parse numeric arguments. [#50709](https://github.com/ClickHouse/ClickHouse/pull/50709) ([Dmitry Kardymon](https://github.com/kardymonds)).
+* Support CSV with whitespace or `\t` field delimiters (these delimiters are also supported in Spark). [#50712](https://github.com/ClickHouse/ClickHouse/pull/50712) ([KevinyhZou](https://github.com/KevinyhZou)).
+* Settings `number_of_mutations_to_delay` and `number_of_mutations_to_throw` are enabled by default now with values 500 and 1000 respectively. [#50726](https://github.com/ClickHouse/ClickHouse/pull/50726) ([Anton Popov](https://github.com/CurtizJ)).
+* The dashboard correctly shows missing values. This closes [#50831](https://github.com/ClickHouse/ClickHouse/issues/50831). [#50832](https://github.com/ClickHouse/ClickHouse/pull/50832) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Added the possibility to use date and time arguments in the syslog timestamp format in functions `parseDateTimeBestEffort*` and `parseDateTime64BestEffort*`. [#50925](https://github.com/ClickHouse/ClickHouse/pull/50925) ([Victor Krasnov](https://github.com/sirvickr)).
+* Command line parameter "--password" in clickhouse-client can now be specified only once. [#50966](https://github.com/ClickHouse/ClickHouse/pull/50966) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Use `hash_of_all_files` from `system.parts` to check identity of parts during on-cluster backups. [#50997](https://github.com/ClickHouse/ClickHouse/pull/50997) ([Vitaly Baranov](https://github.com/vitlibar)).
+* The `connected_time` column in the system table `zookeeper_connection` shows the time when the connection was established (standard format), and a new column `session_uptime_elapsed_seconds` shows how long the session has been established (in seconds). [#51026](https://github.com/ClickHouse/ClickHouse/pull/51026) ([郭小龙](https://github.com/guoxiaolongzte)).
+* Improve the progress bar for file/s3/hdfs/url table functions by using chunk size from source data and using incremental total size counting in each thread. Fix the progress bar for *Cluster functions. This closes [#47250](https://github.com/ClickHouse/ClickHouse/issues/47250). [#51088](https://github.com/ClickHouse/ClickHouse/pull/51088) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add `total_bytes_to_read` to the `Progress` packet in the TCP protocol for a better progress bar. [#51158](https://github.com/ClickHouse/ClickHouse/pull/51158) ([Kruglov Pavel](https://github.com/Avogar)).
+* Better checking of data parts on disks with filesystem cache. [#51164](https://github.com/ClickHouse/ClickHouse/pull/51164) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix occasionally incorrect `current_elements_num` in the fs cache. [#51242](https://github.com/ClickHouse/ClickHouse/pull/51242) ([Kseniia Sumarokova](https://github.com/kssenii)).
+
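+A minimal sketch of the trailing-empty-lines setting above, assuming a local file `data.csv` that ends with a few blank lines:
+
+```sql
+SELECT *
+FROM file('data.csv', 'CSV', 'id UInt32, name String')
+SETTINGS input_format_csv_skip_trailing_empty_lines = 1;
+```
+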
+#### Build/Testing/Packaging Improvement
+* Add embedded keeper-client to standalone keeper binary. [#50964](https://github.com/ClickHouse/ClickHouse/pull/50964) ([pufit](https://github.com/pufit)).
+* An up-to-date LZ4 version is used now. [#50621](https://github.com/ClickHouse/ClickHouse/pull/50621) ([Nikita Taranov](https://github.com/nickitat)).
+* ClickHouse server will print the list of changed settings on fatal errors. This closes [#51137](https://github.com/ClickHouse/ClickHouse/issues/51137). [#51138](https://github.com/ClickHouse/ClickHouse/pull/51138) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Allow building ClickHouse with clang-17. [#51300](https://github.com/ClickHouse/ClickHouse/pull/51300) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* [SQLancer](https://github.com/sqlancer/sqlancer) check is considered stable as bugs that were triggered by it are fixed. Now failures of SQLancer check will be reported as failed check status. [#51340](https://github.com/ClickHouse/ClickHouse/pull/51340) ([Ilya Yatsishin](https://github.com/qoega)).
+* Split the huge `RUN` in the Dockerfile into smaller conditional steps. Install the necessary tools on demand in the same `RUN` layer and remove them after use. Upgrade the OS only once at the beginning. Use a modern way to check the signed repository. Downgrade the base image to ubuntu:20.04 to address issues on older Docker versions. Upgrade the golang version to address golang vulnerabilities. [#51504](https://github.com/ClickHouse/ClickHouse/pull/51504) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Report loading status for executable dictionaries correctly [#48775](https://github.com/ClickHouse/ClickHouse/pull/48775) ([Anton Kozlov](https://github.com/tonickkozlov)).
+* Proper mutation of skip indices and projections [#50104](https://github.com/ClickHouse/ClickHouse/pull/50104) ([Amos Bird](https://github.com/amosbird)).
+* Cleanup moving parts [#50489](https://github.com/ClickHouse/ClickHouse/pull/50489) ([vdimir](https://github.com/vdimir)).
+* Fix backward compatibility for IP types hashing in aggregate functions [#50551](https://github.com/ClickHouse/ClickHouse/pull/50551) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix Log-family tables returning a wrong row count after truncate [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Fix bug in `uniqExact` parallel merging [#50590](https://github.com/ClickHouse/ClickHouse/pull/50590) ([Nikita Taranov](https://github.com/nickitat)).
+* Revert recent grace hash join changes [#50699](https://github.com/ClickHouse/ClickHouse/pull/50699) ([vdimir](https://github.com/vdimir)).
+* Query Cache: Try to fix bad cast from `ColumnConst` to `ColumnVector` [#50704](https://github.com/ClickHouse/ClickHouse/pull/50704) ([Robert Schulze](https://github.com/rschu1ze)).
+* Avoid storing logs in Keeper containing unknown operation [#50751](https://github.com/ClickHouse/ClickHouse/pull/50751) ([Antonio Andelic](https://github.com/antonio2368)).
+* SummingMergeTree support for DateTime64 [#50797](https://github.com/ClickHouse/ClickHouse/pull/50797) ([Jordi Villar](https://github.com/jrdi)).
+* Add compatibility setting for non-const timezones [#50834](https://github.com/ClickHouse/ClickHouse/pull/50834) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix hashing of LDAP params in the cache entries [#50865](https://github.com/ClickHouse/ClickHouse/pull/50865) ([Julian Maicher](https://github.com/jmaicher)).
+* Fallback to parsing big integer from String instead of exception in Parquet format [#50873](https://github.com/ClickHouse/ClickHouse/pull/50873) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix checking the lock file too often while writing a backup [#50889](https://github.com/ClickHouse/ClickHouse/pull/50889) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Do not apply projection if read-in-order was enabled. [#50923](https://github.com/ClickHouse/ClickHouse/pull/50923) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix race in the Azure blob storage iterator [#50936](https://github.com/ClickHouse/ClickHouse/pull/50936) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix erroneous `sort_description` propagation in `CreatingSets` [#50955](https://github.com/ClickHouse/ClickHouse/pull/50955) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix Iceberg v2 optional metadata parsing [#50974](https://github.com/ClickHouse/ClickHouse/pull/50974) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* MaterializedMySQL: Keep parentheses for empty table overrides [#50977](https://github.com/ClickHouse/ClickHouse/pull/50977) ([Val Doroshchuk](https://github.com/valbok)).
+* Fix crash in BackupCoordinationStageSync::setError() [#51012](https://github.com/ClickHouse/ClickHouse/pull/51012) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* Fix ineffective query cache for SELECTs with subqueries [#51132](https://github.com/ClickHouse/ClickHouse/pull/51132) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix Set index with constant nullable comparison. [#51205](https://github.com/ClickHouse/ClickHouse/pull/51205) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix a crash in s3 and s3Cluster functions [#51209](https://github.com/ClickHouse/ClickHouse/pull/51209) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Fix a crash with compiled expressions [#51231](https://github.com/ClickHouse/ClickHouse/pull/51231) ([LiuNeng](https://github.com/liuneng1994)).
+* Fix use-after-free in StorageURL when switching URLs [#51260](https://github.com/ClickHouse/ClickHouse/pull/51260) ([Michael Kolupaev](https://github.com/al13n321)).
+* Updated check for parameterized view [#51272](https://github.com/ClickHouse/ClickHouse/pull/51272) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix multiple writing of same file to backup [#51299](https://github.com/ClickHouse/ClickHouse/pull/51299) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix fuzzer failure in ActionsDAG [#51301](https://github.com/ClickHouse/ClickHouse/pull/51301) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove garbage from function `transform` [#51350](https://github.com/ClickHouse/ClickHouse/pull/51350) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+
+### ClickHouse release 23.5, 2023-06-08
+
+#### Upgrade Notes
+* Compress marks and primary key by default. It significantly reduces the cold query time. Support for compressed marks and primary key was added in version 22.9. If you turned on compressed marks or primary key, or installed version 23.5 or newer (which has compressed marks and primary key on by default), you will not be able to downgrade to version 22.8 or earlier. You can explicitly disable compressed marks or primary keys by specifying the `compress_marks` and `compress_primary_key` settings in the `<merge_tree>` section of the server configuration file (see the sketch after this list). **Upgrade notes:** if you upgrade from a version prior to 22.9, you should either upgrade all replicas at once, disable the compression before the upgrade, or upgrade through an intermediate version where the compressed marks are supported but not enabled by default, such as 23.3. [#42587](https://github.com/ClickHouse/ClickHouse/pull/42587) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Make local object storage work consistently with s3 object storage, fix a problem with append (closes [#48465](https://github.com/ClickHouse/ClickHouse/issues/48465)), and make it configurable as an independent storage. The change is backward incompatible because the cache on top of local object storage is not compatible with previous versions. [#48791](https://github.com/ClickHouse/ClickHouse/pull/48791) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* The experimental feature "in-memory data parts" is removed. The data format is still supported, but the settings are no-op, and compact or wide parts will be used instead. This closes [#45409](https://github.com/ClickHouse/ClickHouse/issues/45409). [#49429](https://github.com/ClickHouse/ClickHouse/pull/49429) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Changed default values of settings `parallelize_output_from_storages` and `input_format_parquet_preserve_order`. This allows ClickHouse to reorder rows when reading from files (e.g. CSV or Parquet), greatly improving performance in many cases. To restore the old behavior of preserving order, use `parallelize_output_from_storages = 0`, `input_format_parquet_preserve_order = 1`. [#49479](https://github.com/ClickHouse/ClickHouse/pull/49479) ([Michael Kolupaev](https://github.com/al13n321)).
+* Make projections production-ready. Add the `optimize_use_projections` setting to control whether the projections will be selected for SELECT queries. The setting `allow_experimental_projection_optimization` is obsolete and does nothing. [#49719](https://github.com/ClickHouse/ClickHouse/pull/49719) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Mark `joinGet` as non-deterministic (as `dictGet` already is). This allows using them in mutations without an extra setting. [#49843](https://github.com/ClickHouse/ClickHouse/pull/49843) ([Azat Khuzhin](https://github.com/azat)).
+* Revert the "`groupArray` returns cannot be nullable" change (due to binary compatibility breakage for `groupArray`/`groupArrayLast`/`groupArraySample` over `Nullable` types, which likely will lead to `TOO_LARGE_ARRAY_SIZE` or `CANNOT_READ_ALL_DATA`). [#49971](https://github.com/ClickHouse/ClickHouse/pull/49971) ([Azat Khuzhin](https://github.com/azat)).
+* Setting `enable_memory_bound_merging_of_aggregation_results` is enabled by default. If you update from a version prior to 22.12, we recommend setting this flag to `false` until the update is finished. [#50319](https://github.com/ClickHouse/ClickHouse/pull/50319) ([Nikita Taranov](https://github.com/nickitat)).
+
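+A sketch of explicitly disabling the new defaults for a single table before a downgrade (the table and column names are hypothetical; the same settings can also be applied server-wide in the `<merge_tree>` section of the configuration file):
+
+```sql
+CREATE TABLE t_uncompressed_marks
+(
+    id UInt64,
+    value String
+)
+ENGINE = MergeTree
+ORDER BY id
+SETTINGS compress_marks = 0, compress_primary_key = 0;
+```
+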
+#### New Feature
+* Added the storage engine AzureBlobStorage and the azureBlobStorage table function. The supported set of features is very similar to the storage/table function S3. [#50604](https://github.com/ClickHouse/ClickHouse/pull/50604) ([alesapin](https://github.com/alesapin), [SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Added a native ClickHouse Keeper CLI client; it is available as `clickhouse keeper-client`. [#47414](https://github.com/ClickHouse/ClickHouse/pull/47414) ([pufit](https://github.com/pufit)).
+* Add `urlCluster` table function. Refactor all *Cluster table functions to reduce code duplication. Make schema inference work for all possible *Cluster function signatures and for named collections. Closes [#38499](https://github.com/ClickHouse/ClickHouse/issues/38499). [#45427](https://github.com/ClickHouse/ClickHouse/pull/45427) ([attack204](https://github.com/attack204)), Pavel Kruglov.
+* The query cache can now be used for production workloads. [#47977](https://github.com/ClickHouse/ClickHouse/pull/47977) ([Robert Schulze](https://github.com/rschu1ze)). The query cache can now support queries with totals and extremes modifier. [#48853](https://github.com/ClickHouse/ClickHouse/pull/48853) ([Robert Schulze](https://github.com/rschu1ze)). Mark the `allow_experimental_query_cache` setting as obsolete for backward compatibility. It was removed in [#47977](https://github.com/ClickHouse/ClickHouse/pull/47977). [#49934](https://github.com/ClickHouse/ClickHouse/pull/49934) ([Timur Solodovnikov](https://github.com/tsolodov)).
+* Geographical data types (`Point`, `Ring`, `Polygon`, and `MultiPolygon`) are production-ready. [#50022](https://github.com/ClickHouse/ClickHouse/pull/50022) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add schema inference to PostgreSQL, MySQL, MeiliSearch, and SQLite table engines. Closes [#49972](https://github.com/ClickHouse/ClickHouse/issues/49972). [#50000](https://github.com/ClickHouse/ClickHouse/pull/50000) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Password type in queries like `CREATE USER u IDENTIFIED BY 'p'` will be automatically set according to the setting `default_password_type` in the `config.xml` on the server. Closes [#42915](https://github.com/ClickHouse/ClickHouse/issues/42915). [#44674](https://github.com/ClickHouse/ClickHouse/pull/44674) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Add bcrypt password authentication type. Closes [#34599](https://github.com/ClickHouse/ClickHouse/issues/34599). [#44905](https://github.com/ClickHouse/ClickHouse/pull/44905) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Introduce the new keyword `APPEND` for `INTO OUTFILE`, as in `INTO OUTFILE 'file.txt' APPEND`. [#48880](https://github.com/ClickHouse/ClickHouse/pull/48880) ([alekar](https://github.com/alekar)).
+* Added `system.zookeeper_connection` table that shows information about Keeper connections. [#45245](https://github.com/ClickHouse/ClickHouse/pull/45245) ([mateng915](https://github.com/mateng0915)).
+* Add new function `generateRandomStructure` that generates random table structure. It can be used in combination with table function `generateRandom`. [#47409](https://github.com/ClickHouse/ClickHouse/pull/47409) ([Kruglov Pavel](https://github.com/Avogar)).
+* Allow the use of `CASE` without an `ELSE` branch and extend `transform` to deal with more types. Also fix some issues that made `transform` return incorrect results when decimal types were mixed with other numeric types. [#48300](https://github.com/ClickHouse/ClickHouse/pull/48300) ([Salvatore Mesoraca](https://github.com/aiven-sal)). This closes #2655. This closes #9596. This closes #38666.
+* Added [server-side encryption using KMS keys](https://docs.aws.amazon.com/AmazonS3/latest/userguide/UsingKMSEncryption.html) with S3 tables, and the `header` setting with S3 disks. Closes [#48723](https://github.com/ClickHouse/ClickHouse/issues/48723). [#48724](https://github.com/ClickHouse/ClickHouse/pull/48724) ([Johann Gan](https://github.com/johanngan)).
+* Add MemoryTracker for the background tasks (merges and mutation). Introduces `merges_mutations_memory_usage_soft_limit` and `merges_mutations_memory_usage_to_ram_ratio` settings that represent the soft memory limit for merges and mutations. If this limit is reached ClickHouse won't schedule new merge or mutation tasks. Also `MergesMutationsMemoryTracking` metric is introduced to allow observing current memory usage of background tasks. Resubmit [#46089](https://github.com/ClickHouse/ClickHouse/issues/46089). Closes [#48774](https://github.com/ClickHouse/ClickHouse/issues/48774). [#48787](https://github.com/ClickHouse/ClickHouse/pull/48787) ([Dmitry Novik](https://github.com/novikd)).
+* Function `dotProduct` now works for arrays. [#49050](https://github.com/ClickHouse/ClickHouse/pull/49050) ([FFFFFFFHHHHHHH](https://github.com/FFFFFFFHHHHHHH)).
+* Support statement `SHOW INDEX` to improve compatibility with MySQL. [#49158](https://github.com/ClickHouse/ClickHouse/pull/49158) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add virtual columns `_file` and `_path` to table function `url`. Improve the error message for table function `url`. Resolves [#49231](https://github.com/ClickHouse/ClickHouse/issues/49231) and [#49232](https://github.com/ClickHouse/ClickHouse/issues/49232). [#49356](https://github.com/ClickHouse/ClickHouse/pull/49356) ([Ziyi Tan](https://github.com/Ziy1-Tan)).
+* Add the `grants` field in the users.xml file, which allows specifying grants for users. [#49381](https://github.com/ClickHouse/ClickHouse/pull/49381) ([pufit](https://github.com/pufit)).
+* Support full/right join by using the grace hash join algorithm. [#49483](https://github.com/ClickHouse/ClickHouse/pull/49483) ([lgbo](https://github.com/lgbo-ustc)).
+* The `WITH FILL` modifier groups filling by sorting prefix. Controlled by the `use_with_fill_by_sorting_prefix` setting (enabled by default). Related to [#33203 (comment)](https://github.com/ClickHouse/ClickHouse/issues/33203#issuecomment-1418736794). [#49503](https://github.com/ClickHouse/ClickHouse/pull/49503) ([Igor Nikonov](https://github.com/devcrafter)).
+* clickhouse-client now accepts queries after `--multiquery` when `--query` (or `-q`) is absent. Example: `clickhouse-client --multiquery "select 1; select 2;"`. [#49870](https://github.com/ClickHouse/ClickHouse/pull/49870) ([Alexey Gerasimchuk](https://github.com/Demilivor)).
+* Add separate `handshake_timeout` for receiving Hello packet from replica. Closes [#48854](https://github.com/ClickHouse/ClickHouse/issues/48854). [#49948](https://github.com/ClickHouse/ClickHouse/pull/49948) ([Kruglov Pavel](https://github.com/Avogar)).
+* Added a function `space` which repeats a space as many times as specified (see the examples after this list). [#50103](https://github.com/ClickHouse/ClickHouse/pull/50103) ([Robert Schulze](https://github.com/rschu1ze)).
+* Added the `--input_format_csv_trim_whitespaces` option. [#50215](https://github.com/ClickHouse/ClickHouse/pull/50215) ([Alexey Gerasimchuk](https://github.com/Demilivor)).
+* Allow the `dictGetAll` function for regexp tree dictionaries to return values from multiple matches as arrays. Closes [#50254](https://github.com/ClickHouse/ClickHouse/issues/50254). [#50255](https://github.com/ClickHouse/ClickHouse/pull/50255) ([Johann Gan](https://github.com/johanngan)).
+* Added `toLastDayOfWeek` function to round a date or a date with time up to the nearest Saturday or Sunday. [#50315](https://github.com/ClickHouse/ClickHouse/pull/50315) ([Victor Krasnov](https://github.com/sirvickr)).
+* Ability to ignore a skip index by specifying `ignore_data_skipping_indices`. [#50329](https://github.com/ClickHouse/ClickHouse/pull/50329) ([Boris Kuschel](https://github.com/bkuschel)).
+* Add `system.user_processes` table and `SHOW USER PROCESSES` query to show memory info and ProfileEvents on user level. [#50492](https://github.com/ClickHouse/ClickHouse/pull/50492) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)).
+* Add server and format settings `display_secrets_in_show_and_select` for displaying secrets of tables, databases, table functions, and dictionaries. Add privilege `displaySecretsInShowAndSelect` controlling which users can view secrets. [#46528](https://github.com/ClickHouse/ClickHouse/pull/46528) ([Mike Kot](https://github.com/myrrc)).
+* Allow setting up a ROW POLICY for all tables that belong to a DATABASE. [#47640](https://github.com/ClickHouse/ClickHouse/pull/47640) ([Ilya Golshtein](https://github.com/ilejn)).
+
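+Two of the new functions above in action (minimal queries; the exact day returned by `toLastDayOfWeek` depends on its optional mode argument):
+
+```sql
+SELECT concat('[', space(3), ']');            -- '[   ]'
+SELECT toLastDayOfWeek(toDate('2023-06-08')); -- rounds up to the nearest Saturday or Sunday
+```
+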
+#### Performance Improvement
+* Compress marks and primary key by default. It significantly reduces the cold query time. Support for compressed marks and primary key was added in version 22.9. If you turned on compressed marks or primary key, or installed version 23.5 or newer (which has compressed marks and primary key on by default), you will not be able to downgrade to version 22.8 or earlier. You can also explicitly disable compressed marks or primary keys by specifying the `compress_marks` and `compress_primary_key` settings in the `<merge_tree>` section of the server configuration file. [#42587](https://github.com/ClickHouse/ClickHouse/pull/42587) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* The new setting `s3_max_inflight_parts_for_one_file` limits the number of concurrently uploaded parts of a multipart upload for a single file. [#49961](https://github.com/ClickHouse/ClickHouse/pull/49961) ([Sema Checherinda](https://github.com/CheSema)).
+* When reading from multiple files, reduce the number of parallel parsing threads for each file. Resolves [#42192](https://github.com/ClickHouse/ClickHouse/issues/42192). [#46661](https://github.com/ClickHouse/ClickHouse/pull/46661) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Use an aggregate projection only if it reads fewer granules than normal reading. It should help in case a query hits the PK of the table but not the projection. Fixes [#49150](https://github.com/ClickHouse/ClickHouse/issues/49150). [#49417](https://github.com/ClickHouse/ClickHouse/pull/49417) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Do not store blocks in `ANY` hash join if nothing is inserted. [#48633](https://github.com/ClickHouse/ClickHouse/pull/48633) ([vdimir](https://github.com/vdimir)).
+* Fix the aggregate combinator `-If` when JIT-compiled, and enable JIT compilation for aggregate functions. Closes [#48120](https://github.com/ClickHouse/ClickHouse/issues/48120). [#49083](https://github.com/ClickHouse/ClickHouse/pull/49083) ([Igor Nikonov](https://github.com/devcrafter)).
+* For reading from remote tables, we use smaller tasks (instead of reading the whole part) to make task stealing work: the task size is determined by the size of the columns to read; 1 MB buffers are always used for reading from S3; and boundaries of cache segments are aligned to 1 MB, so they have a decent size even with small tasks (this also should prevent fragmentation). [#49287](https://github.com/ClickHouse/ClickHouse/pull/49287) ([Nikita Taranov](https://github.com/nickitat)).
+* Introduced settings `merge_max_block_size_bytes` (to limit the amount of memory used for background operations) and `vertical_merge_algorithm_min_bytes_to_activate` (an additional condition to activate vertical merges). [#49313](https://github.com/ClickHouse/ClickHouse/pull/49313) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Default size of a read buffer for reading from local filesystem changed to a slightly better value. Also two new settings are introduced: `max_read_buffer_size_local_fs` and `max_read_buffer_size_remote_fs`. [#49321](https://github.com/ClickHouse/ClickHouse/pull/49321) ([Nikita Taranov](https://github.com/nickitat)).
+* Improve memory usage and speed of `SPARSE_HASHED`/`HASHED` dictionaries (e.g. `SPARSE_HASHED` now eats 2.6x less memory, and is ~2x faster). [#49380](https://github.com/ClickHouse/ClickHouse/pull/49380) ([Azat Khuzhin](https://github.com/azat)).
+* Optimize the `system.query_log` and `system.query_thread_log` tables by applying `LowCardinality` when appropriate. The queries over these tables will be faster. [#49530](https://github.com/ClickHouse/ClickHouse/pull/49530) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Better performance when reading local `Parquet` files (through parallel reading). [#49539](https://github.com/ClickHouse/ClickHouse/pull/49539) ([Michael Kolupaev](https://github.com/al13n321)).
+* Improve the performance of `RIGHT/FULL JOIN` by up to 2 times in certain scenarios, especially when joining a small left table with a large right table. [#49585](https://github.com/ClickHouse/ClickHouse/pull/49585) ([lgbo](https://github.com/lgbo-ustc)).
+* Improve performance of BLAKE3 by 11% by enabling LTO for Rust. [#49600](https://github.com/ClickHouse/ClickHouse/pull/49600) ([Azat Khuzhin](https://github.com/azat)). Now it is on par with C++.
+* Optimize the structure of the `system.opentelemetry_span_log`. Use `LowCardinality` where appropriate. Although this table is generally stupid (it is using the Map data type even for common attributes), it will be slightly better. [#49647](https://github.com/ClickHouse/ClickHouse/pull/49647) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Try to reserve the hash table's size in the `grace_hash` join (see the sketch after this list). [#49816](https://github.com/ClickHouse/ClickHouse/pull/49816) ([lgbo](https://github.com/lgbo-ustc)).
+* Parallel merge of `uniqExactIf` states. Closes [#49885](https://github.com/ClickHouse/ClickHouse/issues/49885). [#50285](https://github.com/ClickHouse/ClickHouse/pull/50285) ([flynn](https://github.com/ucasfl)).
+* Keeper improvement: add the `CheckNotExists` request to Keeper, which improves the performance of Replicated tables. [#48897](https://github.com/ClickHouse/ClickHouse/pull/48897) ([Antonio Andelic](https://github.com/antonio2368)).
+* Keeper performance improvements: avoid serializing same request twice while processing. Cache deserialization results of large requests. Controlled by new coordination setting `min_request_size_for_cache`. [#49004](https://github.com/ClickHouse/ClickHouse/pull/49004) ([Antonio Andelic](https://github.com/antonio2368)).
+* Reduced the number of `List` ZooKeeper requests when selecting parts to merge while a lot of partitions do not have anything to merge. [#49637](https://github.com/ClickHouse/ClickHouse/pull/49637) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Rework locking in the FS cache [#44985](https://github.com/ClickHouse/ClickHouse/pull/44985) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Disable pure parallel replicas if trivial count optimization is possible. [#50594](https://github.com/ClickHouse/ClickHouse/pull/50594) ([Raúl Marín](https://github.com/Algunenano)).
+* Don't send HEAD requests for all keys in Iceberg schema inference, only for keys that are used for reading data. [#50203](https://github.com/ClickHouse/ClickHouse/pull/50203) ([Kruglov Pavel](https://github.com/Avogar)).
+* Setting `enable_memory_bound_merging_of_aggregation_results` is enabled by default. [#50319](https://github.com/ClickHouse/ClickHouse/pull/50319) ([Nikita Taranov](https://github.com/nickitat)).
+
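+A minimal sketch of selecting the grace hash join mentioned above (the tables `t1` and `t2` are hypothetical):
+
+```sql
+SET join_algorithm = 'grace_hash';
+SELECT count()
+FROM t1
+INNER JOIN t2 ON t1.key = t2.key;
+```
+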
+#### Experimental Feature
+* The `DEFLATE_QPL` codec lowers the minimum SIMD requirement to SSE 4.2 ([doc change in qpl](https://github.com/intel/qpl/commit/3f8f5cea27739f5261e8fd577dc233ffe88bf679)). Intel® QPL relies on a run-time kernel dispatcher and a cpuid check to choose the best available implementation (SSE/AVX2/AVX512). The CMake file for the QPL build in ClickHouse was restructured to align with the latest upstream QPL. [#49811](https://github.com/ClickHouse/ClickHouse/pull/49811) ([jasperzhu](https://github.com/jinjunzh)).
+* Add initial support to do JOINs with pure parallel replicas. [#49544](https://github.com/ClickHouse/ClickHouse/pull/49544) ([Raúl Marín](https://github.com/Algunenano)).
+* More parallelism on `Outdated` parts removal with "zero-copy replication". [#49630](https://github.com/ClickHouse/ClickHouse/pull/49630) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Parallel Replicas: 1) Fixed an error `NOT_FOUND_COLUMN_IN_BLOCK` when using parallel replicas with non-replicated storage and the setting `parallel_replicas_for_non_replicated_merge_tree` disabled. 2) Now `allow_experimental_parallel_reading_from_replicas` has 3 possible values: 0 - disabled; 1 - enabled, silently disabled in case of failure (e.g. with FINAL or JOIN); 2 - enabled, throwing an exception in case of failure (see the example after this list). 3) If the FINAL modifier is used in a SELECT query and parallel replicas are enabled, ClickHouse will try to disable them if `allow_experimental_parallel_reading_from_replicas` is set to 1, and throw an exception otherwise. [#50195](https://github.com/ClickHouse/ClickHouse/pull/50195) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* When parallel replicas are enabled they will always skip unavailable servers (the behavior is controlled by the setting `skip_unavailable_shards`, enabled by default and can be only disabled). This closes: [#48565](https://github.com/ClickHouse/ClickHouse/issues/48565). [#50293](https://github.com/ClickHouse/ClickHouse/pull/50293) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+
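+The three-valued setting described above can be set per session or per query; a sketch (an existing cluster with several replicas is assumed):
+
+```sql
+-- 0 - disabled; 1 - enabled with silent fallback on failure; 2 - enabled, throwing on failure:
+SET allow_experimental_parallel_reading_from_replicas = 2;
+```
+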
+#### Improvement
+* The `BACKUP` command will not decrypt data from encrypted disks while making a backup. Instead the data will be stored in a backup in encrypted form. Such backups can be restored only to an encrypted disk with the same (or extended) list of encryption keys. [#48896](https://github.com/ClickHouse/ClickHouse/pull/48896) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Added the possibility to use temporary tables in the FROM part of `ATTACH PARTITION FROM` and `REPLACE PARTITION FROM`. [#49436](https://github.com/ClickHouse/ClickHouse/pull/49436) ([Roman Vasin](https://github.com/rvasin)).
+* Added setting `async_insert` for `MergeTree` tables. It has the same meaning as the query-level setting `async_insert` and enables asynchronous inserts for a specific table. Note: it doesn't take effect for insert queries from `clickhouse-client`; use the query-level setting in that case. [#49122](https://github.com/ClickHouse/ClickHouse/pull/49122) ([Anton Popov](https://github.com/CurtizJ)).
+* Add support for size suffixes in quota creation statement parameters. [#49087](https://github.com/ClickHouse/ClickHouse/pull/49087) ([Eridanus](https://github.com/Eridanus117)).
+* Extend `first_value` and `last_value` to accept NULL. [#46467](https://github.com/ClickHouse/ClickHouse/pull/46467) ([lgbo](https://github.com/lgbo-ustc)).
+* Add aliases `str_to_map` and `mapFromString` for `extractKeyValuePairs`. Closes [#47185](https://github.com/ClickHouse/ClickHouse/issues/47185). [#49466](https://github.com/ClickHouse/ClickHouse/pull/49466) ([flynn](https://github.com/ucasfl)).
+* Add support for CGroup version 2 for asynchronous metrics about the memory usage and availability. This closes [#37983](https://github.com/ClickHouse/ClickHouse/issues/37983). [#45999](https://github.com/ClickHouse/ClickHouse/pull/45999) ([sichenzhao](https://github.com/sichenzhao)).
+* Cluster table functions should always skip unavailable shards. Closes [#46314](https://github.com/ClickHouse/ClickHouse/issues/46314). [#46765](https://github.com/ClickHouse/ClickHouse/pull/46765) ([zk_kiger](https://github.com/zk-kiger)).
+* Allow CSV file to contain empty columns in its header. [#47496](https://github.com/ClickHouse/ClickHouse/pull/47496) ([你不要过来啊](https://github.com/iiiuwioajdks)).
+* Add Google Cloud Storage S3 compatible table function `gcs`. Like the `oss` and `cosn` functions, it is just an alias over the `s3` table function, and it does not bring any new features. [#47815](https://github.com/ClickHouse/ClickHouse/pull/47815) ([Kuba Kaflik](https://github.com/jkaflik)).
+* Add ability to use strict parts size for S3 (compatibility with CloudFlare R2 S3 Storage). [#48492](https://github.com/ClickHouse/ClickHouse/pull/48492) ([Azat Khuzhin](https://github.com/azat)).
+* Added new columns with info about `Replicated` database replicas to `system.clusters`: `database_shard_name`, `database_replica_name`, `is_active`. Added an optional `FROM SHARD` clause to `SYSTEM DROP DATABASE REPLICA` query. [#48548](https://github.com/ClickHouse/ClickHouse/pull/48548) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Add a new column `zookeeper_name` in system.replicas, to indicate on which (auxiliary) zookeeper cluster the replicated table's metadata is stored. [#48549](https://github.com/ClickHouse/ClickHouse/pull/48549) ([cangyin](https://github.com/cangyin)).
+* The `IN` operator supports the comparison of `Date` and `Date32`. Closes [#48736](https://github.com/ClickHouse/ClickHouse/issues/48736). [#48806](https://github.com/ClickHouse/ClickHouse/pull/48806) ([flynn](https://github.com/ucasfl)).
+* Support for erasure codes in `HDFS`, author: @M1eyu2018, @tomscut. [#48833](https://github.com/ClickHouse/ClickHouse/pull/48833) ([M1eyu](https://github.com/M1eyu2018)).
+* Implement SYSTEM DROP REPLICA from auxiliary ZooKeeper clusters; may close [#48931](https://github.com/ClickHouse/ClickHouse/issues/48931). [#48932](https://github.com/ClickHouse/ClickHouse/pull/48932) ([wangxiaobo](https://github.com/wzb5212)).
+* Add Array data type to MongoDB. Closes [#48598](https://github.com/ClickHouse/ClickHouse/issues/48598). [#48983](https://github.com/ClickHouse/ClickHouse/pull/48983) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Support storing `Interval` data types in tables. [#49085](https://github.com/ClickHouse/ClickHouse/pull/49085) ([larryluogit](https://github.com/larryluogit)).
+* Allow using the `ntile` window function without an explicit window frame definition: `ntile(3) OVER (ORDER BY a)`; see the examples at the end of this list. Closes [#46763](https://github.com/ClickHouse/ClickHouse/issues/46763). [#49093](https://github.com/ClickHouse/ClickHouse/pull/49093) ([vdimir](https://github.com/vdimir)).
+* Added settings (`number_of_mutations_to_delay`, `number_of_mutations_to_throw`) to delay or throw `ALTER` queries that create mutations (`ALTER UPDATE`, `ALTER DELETE`, `ALTER MODIFY COLUMN`, ...) in case when table already has a lot of unfinished mutations. [#49117](https://github.com/ClickHouse/ClickHouse/pull/49117) ([Anton Popov](https://github.com/CurtizJ)).
+* Catch exception from `create_directories` in filesystem cache. [#49203](https://github.com/ClickHouse/ClickHouse/pull/49203) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Copies embedded examples to a new field `example` in `system.functions` to supplement the field `description`. [#49222](https://github.com/ClickHouse/ClickHouse/pull/49222) ([Dan Roscigno](https://github.com/DanRoscigno)).
+* Enable connection options for the MongoDB dictionary. [#49225](https://github.com/ClickHouse/ClickHouse/pull/49225) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+* Added an alias `asymptotic` for `asymp` computational method for `kolmogorovSmirnovTest`. Improved documentation. [#49286](https://github.com/ClickHouse/ClickHouse/pull/49286) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Aggregation function groupBitAnd/Or/Xor now work on signed integer data. This makes them consistent with the behavior of scalar functions bitAnd/Or/Xor. [#49292](https://github.com/ClickHouse/ClickHouse/pull/49292) ([exmy](https://github.com/exmy)).
+* Split function-documentation into more fine-granular fields. [#49300](https://github.com/ClickHouse/ClickHouse/pull/49300) ([Robert Schulze](https://github.com/rschu1ze)).
+* Use multiple threads shared between all tables within a server to load outdated data parts. The size of the pool and its queue are controlled by the `max_outdated_parts_loading_thread_pool_size` and `outdated_part_loading_thread_pool_queue_size` settings. [#49317](https://github.com/ClickHouse/ClickHouse/pull/49317) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Don't overestimate the size of processed data for `LowCardinality` columns when they share dictionaries between blocks. This closes [#49322](https://github.com/ClickHouse/ClickHouse/issues/49322). See also [#48745](https://github.com/ClickHouse/ClickHouse/issues/48745). [#49323](https://github.com/ClickHouse/ClickHouse/pull/49323) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Parquet writer now uses reasonable row group size when invoked through `OUTFILE`. [#49325](https://github.com/ClickHouse/ClickHouse/pull/49325) ([Michael Kolupaev](https://github.com/al13n321)).
+* Allow restricted keywords like `ARRAY` as an alias if the alias is quoted. Closes [#49324](https://github.com/ClickHouse/ClickHouse/issues/49324). [#49360](https://github.com/ClickHouse/ClickHouse/pull/49360) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Data parts loading and deletion jobs were moved to shared server-wide pools instead of per-table pools. Pools sizes are controlled via settings `max_active_parts_loading_thread_pool_size`, `max_outdated_parts_loading_thread_pool_size` and `max_parts_cleaning_thread_pool_size` in top-level config. Table-level settings `max_part_loading_threads` and `max_part_removal_threads` became obsolete. [#49474](https://github.com/ClickHouse/ClickHouse/pull/49474) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Allow `?password=pass` in URL of the Play UI. Password is replaced in browser history. [#49505](https://github.com/ClickHouse/ClickHouse/pull/49505) ([Mike Kot](https://github.com/myrrc)).
+* Allow reading zero-size objects from remote filesystems (empty files are not backed up, so we might end up with zero blobs in the metadata file). Closes [#49480](https://github.com/ClickHouse/ClickHouse/issues/49480). [#49519](https://github.com/ClickHouse/ClickHouse/pull/49519) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Attach thread MemoryTracker to `total_memory_tracker` after `ThreadGroup` detached. [#49527](https://github.com/ClickHouse/ClickHouse/pull/49527) ([Dmitry Novik](https://github.com/novikd)).
+* Fix parameterized views when a query parameter is used multiple times in the query. [#49556](https://github.com/ClickHouse/ClickHouse/pull/49556) ([Azat Khuzhin](https://github.com/azat)).
+* Release memory allocated for the last sent ProfileEvents snapshot in the context of a query. Followup [#47564](https://github.com/ClickHouse/ClickHouse/issues/47564). [#49561](https://github.com/ClickHouse/ClickHouse/pull/49561) ([Dmitry Novik](https://github.com/novikd)).
+* Function `makeDate` now provides a MySQL-compatible overload (year & day of the year arguments); see the examples at the end of this list. [#49603](https://github.com/ClickHouse/ClickHouse/pull/49603) ([Robert Schulze](https://github.com/rschu1ze)).
+* Support `dictionary` table function for `RegExpTreeDictionary`. [#49666](https://github.com/ClickHouse/ClickHouse/pull/49666) ([Han Fei](https://github.com/hanfei1991)).
+* Added weighted fair IO scheduling policy. Added dynamic resource manager, which allows IO scheduling hierarchy to be updated in runtime w/o server restarts. [#49671](https://github.com/ClickHouse/ClickHouse/pull/49671) ([Sergei Trifonov](https://github.com/serxa)).
+* Add compose request after multipart upload to GCS. This enables the usage of copy operation on objects uploaded with the multipart upload. It's recommended to set `s3_strict_upload_part_size` to some value because compose request can fail on objects created with parts of different sizes. [#49693](https://github.com/ClickHouse/ClickHouse/pull/49693) ([Antonio Andelic](https://github.com/antonio2368)).
+* For the `extractKeyValuePairs` function: improve the "best-effort" parsing logic to accept `key_value_delimiter` as a valid part of the value. This also simplifies branching and might even speed up things a bit. [#49760](https://github.com/ClickHouse/ClickHouse/pull/49760) ([Arthur Passos](https://github.com/arthurpassos)).
+* Add `initial_query_id` field for system.processors_profile_log [#49777](https://github.com/ClickHouse/ClickHouse/pull/49777) ([helifu](https://github.com/helifu)).
+* System log tables can now have custom sorting keys. [#49778](https://github.com/ClickHouse/ClickHouse/pull/49778) ([helifu](https://github.com/helifu)).
+* A new field `partitions` in `system.query_log` indicates which partitions participated in the calculation of a query. [#49779](https://github.com/ClickHouse/ClickHouse/pull/49779) ([helifu](https://github.com/helifu)).
+* Added `enable_the_endpoint_id_with_zookeeper_name_prefix` setting for `ReplicatedMergeTree` (disabled by default). When enabled, it adds ZooKeeper cluster name to table's interserver communication endpoint. It avoids `Duplicate interserver IO endpoint` errors when having replicated tables with the same path, but different auxiliary ZooKeepers. [#49780](https://github.com/ClickHouse/ClickHouse/pull/49780) ([helifu](https://github.com/helifu)).
+* Add query parameters to `clickhouse-local`. Closes [#46561](https://github.com/ClickHouse/ClickHouse/issues/46561). [#49785](https://github.com/ClickHouse/ClickHouse/pull/49785) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Allow loading dictionaries and functions from YAML by default. In previous versions, it required editing the `dictionaries_config` or `user_defined_executable_functions_config` in the configuration file, as they expected `*.xml` files. [#49812](https://github.com/ClickHouse/ClickHouse/pull/49812) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* The Kafka table engine now allows using alias columns. [#49824](https://github.com/ClickHouse/ClickHouse/pull/49824) ([Aleksandr Musorin](https://github.com/AVMusorin)).
+* Add setting to limit the max number of pairs produced by `extractKeyValuePairs`, a safeguard to avoid using way too much memory. [#49836](https://github.com/ClickHouse/ClickHouse/pull/49836) ([Arthur Passos](https://github.com/arthurpassos)).
+* Add support for (an unusual) case where the arguments in the `IN` operator are single-element tuples. [#49844](https://github.com/ClickHouse/ClickHouse/pull/49844) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+* The `bitHammingDistance` function supports the `String` and `FixedString` data types. Closes [#48827](https://github.com/ClickHouse/ClickHouse/issues/48827). [#49858](https://github.com/ClickHouse/ClickHouse/pull/49858) ([flynn](https://github.com/ucasfl)).
+* Fix timeout resetting errors in the client on OS X. [#49863](https://github.com/ClickHouse/ClickHouse/pull/49863) ([alekar](https://github.com/alekar)).
+* Add support for big integers, such as `UInt128`, `Int128`, `UInt256`, and `Int256`, in the function `bitCount`. This enables Hamming distance over large bit masks for AI applications (see the sketch after this list). [#49867](https://github.com/ClickHouse/ClickHouse/pull/49867) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fingerprints are now used instead of key IDs in encrypted disks. This simplifies the configuration of encrypted disks. [#49882](https://github.com/ClickHouse/ClickHouse/pull/49882) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Add support for the UUID data type when working with PostgreSQL. Closes [#49739](https://github.com/ClickHouse/ClickHouse/issues/49739). [#49894](https://github.com/ClickHouse/ClickHouse/pull/49894) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Function `toUnixTimestamp` now accepts `Date` and `Date32` arguments. [#49989](https://github.com/ClickHouse/ClickHouse/pull/49989) ([Victor Krasnov](https://github.com/sirvickr)).
+* Charge only server memory for dictionaries. [#49995](https://github.com/ClickHouse/ClickHouse/pull/49995) ([Azat Khuzhin](https://github.com/azat)).
+* The server will allow using the `SQL_*` settings such as `SQL_AUTO_IS_NULL` as no-ops for MySQL compatibility. This closes [#49927](https://github.com/ClickHouse/ClickHouse/issues/49927). [#50013](https://github.com/ClickHouse/ClickHouse/pull/50013) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Preserve initial_query_id for ON CLUSTER queries, which is useful for introspection (under `distributed_ddl_entry_format_version=5`). [#50015](https://github.com/ClickHouse/ClickHouse/pull/50015) ([Azat Khuzhin](https://github.com/azat)).
+* Preserve backward compatibility for renamed settings by using aliases (`allow_experimental_projection_optimization` for `optimize_use_projections`, `allow_experimental_lightweight_delete` for `enable_lightweight_delete`). [#50044](https://github.com/ClickHouse/ClickHouse/pull/50044) ([Azat Khuzhin](https://github.com/azat)).
+* Support passing an FQDN through the `my_hostname` setting to register a cluster node in Keeper. Add an `invisible` setting to support multiple compute groups: a compute group, as a cluster, is invisible to other compute groups. [#50186](https://github.com/ClickHouse/ClickHouse/pull/50186) ([Yangkuan Liu](https://github.com/LiuYangkuan)).
+* Fix PostgreSQL reading all the data even when `LIMIT n` is specified. [#50187](https://github.com/ClickHouse/ClickHouse/pull/50187) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Add new profile events for queries with subqueries (`QueriesWithSubqueries`/`SelectQueriesWithSubqueries`/`InsertQueriesWithSubqueries`). [#50204](https://github.com/ClickHouse/ClickHouse/pull/50204) ([Azat Khuzhin](https://github.com/azat)).
+* Add the `roles` field to the `users.xml` file, which allows specifying roles with grants via a config file. [#50278](https://github.com/ClickHouse/ClickHouse/pull/50278) ([pufit](https://github.com/pufit)).
+* Report `CGroupCpuCfsPeriod` and `CGroupCpuCfsQuota` in `AsynchronousMetrics`, and respect cgroup v2 memory limits during server startup. [#50379](https://github.com/ClickHouse/ClickHouse/pull/50379) ([alekar](https://github.com/alekar)).
+* Add a signal handler for SIGQUIT to work the same way as SIGINT. Closes [#50298](https://github.com/ClickHouse/ClickHouse/issues/50298). [#50435](https://github.com/ClickHouse/ClickHouse/pull/50435) ([Nikolay Degterinsky](https://github.com/evillique)).
+* If JSON parsing fails due to a large object size, output the last position, to allow debugging. [#50474](https://github.com/ClickHouse/ClickHouse/pull/50474) ([Valentin Alexeev](https://github.com/valentinalexeev)).
+* Support decimals with non-fixed size. Closes [#49130](https://github.com/ClickHouse/ClickHouse/issues/49130). [#50586](https://github.com/ClickHouse/ClickHouse/pull/50586) ([Kruglov Pavel](https://github.com/Avogar)).
+
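+As an illustration of the `bitCount` entry above: the Hamming distance between two bit masks is just the popcount of their XOR. A minimal standalone C++ sketch of the same computation for a 256-bit mask (an illustrative stand-in, not ClickHouse code):
+
+```cpp
+#include <bit>
+#include <cstdint>
+
+// Hamming distance of two 256-bit masks stored as four 64-bit limbs:
+// XOR limb by limb and count the set bits.
+int hammingDistance256(const uint64_t a[4], const uint64_t b[4])
+{
+    int distance = 0;
+    for (int i = 0; i < 4; ++i)
+        distance += std::popcount(a[i] ^ b[i]);
+    return distance;
+}
+```
+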
+#### Build/Testing/Packaging Improvement
+* New and improved `keeper-bench`. Everything can be customized from a YAML/XML file: each type of request generator can have its own specific set of fields; multi requests can be generated simply by nesting the same under a `multi` key; a `weight` field can be defined for each request or subrequest in a multi request to control the distribution; trees that need to be set up for a test run can be defined; hosts can be defined with all timeouts customizable, and it's possible to control how many sessions to generate for each host; integers defined with `min_value` and `max_value` fields act as random number generators. [#48547](https://github.com/ClickHouse/ClickHouse/pull/48547) ([Antonio Andelic](https://github.com/antonio2368)).
+* `io_uring` is not supported on macOS; don't choose it when running tests locally, to avoid occasional failures. [#49250](https://github.com/ClickHouse/ClickHouse/pull/49250) ([Frank Chen](https://github.com/FrankChen021)).
+* Support named fault injection for testing. [#49361](https://github.com/ClickHouse/ClickHouse/pull/49361) ([Han Fei](https://github.com/hanfei1991)).
+* Allow running ClickHouse on operating systems where the `prctl` (process control) syscall is not available, such as AWS Lambda. [#49538](https://github.com/ClickHouse/ClickHouse/pull/49538) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fixed a build conflict between `contrib/isa-l` and the isa-l bundled in QPL [#49296](https://github.com/ClickHouse/ClickHouse/issues/49296). [#49584](https://github.com/ClickHouse/ClickHouse/pull/49584) ([jasperzhu](https://github.com/jinjunzh)).
+* Utilities are now only built if explicitly requested (`-DENABLE_UTILS=1`) instead of by default; this reduces link times in typical development builds. [#49620](https://github.com/ClickHouse/ClickHouse/pull/49620) ([Robert Schulze](https://github.com/rschu1ze)).
+* Pull the build description of idxd-config into a separate CMake file to avoid accidental removal in the future. [#49651](https://github.com/ClickHouse/ClickHouse/pull/49651) ([jasperzhu](https://github.com/jinjunzh)).
+* Add a CI check with the analyzer enabled on master. Follow-up to [#49562](https://github.com/ClickHouse/ClickHouse/issues/49562). [#49668](https://github.com/ClickHouse/ClickHouse/pull/49668) ([Dmitry Novik](https://github.com/novikd)).
+* Switch to LLVM/clang 16. [#49678](https://github.com/ClickHouse/ClickHouse/pull/49678) ([Azat Khuzhin](https://github.com/azat)).
+* Allow building ClickHouse with clang-17. [#49851](https://github.com/ClickHouse/ClickHouse/pull/49851) ([Alexey Milovidov](https://github.com/alexey-milovidov)). [#50410](https://github.com/ClickHouse/ClickHouse/pull/50410) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* ClickHouse is now easier to integrate into other CMake projects. [#49991](https://github.com/ClickHouse/ClickHouse/pull/49991) ([Amos Bird](https://github.com/amosbird)). (Doing so is strongly discouraged - Alexey Milovidov).
+* Fix strange additional QEMU logging after [#47151](https://github.com/ClickHouse/ClickHouse/issues/47151), see https://s3.amazonaws.com/clickhouse-test-reports/50078/a4743996ee4f3583884d07bcd6501df0cfdaa346/stateless_tests__release__databasereplicated__[3_4].html. [#50442](https://github.com/ClickHouse/ClickHouse/pull/50442) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* ClickHouse can work on Linux RISC-V 6.1.22. This closes [#50456](https://github.com/ClickHouse/ClickHouse/issues/50456). [#50457](https://github.com/ClickHouse/ClickHouse/pull/50457) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Bump internal protobuf to v3.18 (fixes bogus CVE-2022-1941). [#50400](https://github.com/ClickHouse/ClickHouse/pull/50400) ([Robert Schulze](https://github.com/rschu1ze)).
+* Bump internal libxml2 to v2.10.4 (fixes bogus CVE-2023-28484 and bogus CVE-2023-29469). [#50402](https://github.com/ClickHouse/ClickHouse/pull/50402) ([Robert Schulze](https://github.com/rschu1ze)).
+* Bump c-ares to v1.19.1 (bogus CVE-2023-32067, bogus CVE-2023-31130, bogus CVE-2023-31147). [#50403](https://github.com/ClickHouse/ClickHouse/pull/50403) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix bogus CVE-2022-2469 in libgsasl. [#50404](https://github.com/ClickHouse/ClickHouse/pull/50404) ([Robert Schulze](https://github.com/rschu1ze)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* ActionsDAG: fix wrong optimization [#47584](https://github.com/ClickHouse/ClickHouse/pull/47584) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* Correctly handle concurrent snapshots in Keeper [#48466](https://github.com/ClickHouse/ClickHouse/pull/48466) ([Antonio Andelic](https://github.com/antonio2368)).
+* MergeTreeMarksLoader holds DataPart instead of DataPartStorage [#48515](https://github.com/ClickHouse/ClickHouse/pull/48515) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Sequence state fix [#48603](https://github.com/ClickHouse/ClickHouse/pull/48603) ([Ilya Golshtein](https://github.com/ilejn)).
+* Back/Restore concurrency check on previous fails [#48726](https://github.com/ClickHouse/ClickHouse/pull/48726) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix: attaching a table with a non-existent ZK path did not increase the `ReadonlyReplica` metric [#48954](https://github.com/ClickHouse/ClickHouse/pull/48954) ([wangxiaobo](https://github.com/wzb5212)).
+* Fix possible terminate called for uncaught exception in some places [#49112](https://github.com/ClickHouse/ClickHouse/pull/49112) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix key not found error for queries with multiple StorageJoin [#49137](https://github.com/ClickHouse/ClickHouse/pull/49137) ([vdimir](https://github.com/vdimir)).
+* Fix wrong query result when using nullable primary key [#49172](https://github.com/ClickHouse/ClickHouse/pull/49172) ([Duc Canh Le](https://github.com/canhld94)).
+* Fix reinterpretAs*() on big endian machines [#49198](https://github.com/ClickHouse/ClickHouse/pull/49198) ([Suzy Wang](https://github.com/SuzyWangIBMer)).
+* (Experimental zero-copy replication) Lock zero copy parts more atomically [#49211](https://github.com/ClickHouse/ClickHouse/pull/49211) ([alesapin](https://github.com/alesapin)).
+* Fix race on Outdated parts loading [#49223](https://github.com/ClickHouse/ClickHouse/pull/49223) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix wrong answer when all key values are NULL and GROUP BY uses ROLLUP [#49282](https://github.com/ClickHouse/ClickHouse/pull/49282) ([Shuai li](https://github.com/loneylee)).
+* Fix calculating load_factor for HASHED dictionaries with SHARDS [#49319](https://github.com/ClickHouse/ClickHouse/pull/49319) ([Azat Khuzhin](https://github.com/azat)).
+* Disallow configuring compression CODECs for alias columns [#49363](https://github.com/ClickHouse/ClickHouse/pull/49363) ([Timur Solodovnikov](https://github.com/tsolodov)).
+* Fix bug in removal of existing part directory [#49365](https://github.com/ClickHouse/ClickHouse/pull/49365) ([alesapin](https://github.com/alesapin)).
+* Properly fix GCS when HMAC is used [#49390](https://github.com/ClickHouse/ClickHouse/pull/49390) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix fuzz bug when subquery set is not built when reading from remote() [#49425](https://github.com/ClickHouse/ClickHouse/pull/49425) ([Alexander Gololobov](https://github.com/davenger)).
+* Invert `shutdown_wait_unfinished_queries` [#49427](https://github.com/ClickHouse/ClickHouse/pull/49427) ([Konstantin Bogdanov](https://github.com/thevar1able)).
+* (Experimental zero-copy replication) Fix another zero copy bug [#49473](https://github.com/ClickHouse/ClickHouse/pull/49473) ([alesapin](https://github.com/alesapin)).
+* Fix postgres database setting [#49481](https://github.com/ClickHouse/ClickHouse/pull/49481) ([Mal Curtis](https://github.com/snikch)).
+* Correctly handle `s3Cluster` arguments [#49490](https://github.com/ClickHouse/ClickHouse/pull/49490) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix bug in TraceCollector destructor. [#49508](https://github.com/ClickHouse/ClickHouse/pull/49508) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix AsynchronousReadIndirectBufferFromRemoteFS breaking on short seeks [#49525](https://github.com/ClickHouse/ClickHouse/pull/49525) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix dictionaries loading order [#49560](https://github.com/ClickHouse/ClickHouse/pull/49560) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Forbid the change of data type of Object('json') column [#49563](https://github.com/ClickHouse/ClickHouse/pull/49563) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Fix stress test (Logical error: Expected 7134 >= 11030) [#49623](https://github.com/ClickHouse/ClickHouse/pull/49623) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix bug in DISTINCT [#49628](https://github.com/ClickHouse/ClickHouse/pull/49628) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix: DISTINCT in order with zero values in non-sorted columns [#49636](https://github.com/ClickHouse/ClickHouse/pull/49636) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix off-by-one error in big integers found by UBSan with fuzzer [#49645](https://github.com/ClickHouse/ClickHouse/pull/49645) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix reading from sparse columns after restart [#49660](https://github.com/ClickHouse/ClickHouse/pull/49660) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix assert in SpanHolder::finish() with fibers [#49673](https://github.com/ClickHouse/ClickHouse/pull/49673) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix short circuit functions and mutations with sparse arguments [#49716](https://github.com/ClickHouse/ClickHouse/pull/49716) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix writing appended files to incremental backups [#49725](https://github.com/ClickHouse/ClickHouse/pull/49725) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix "There is no physical column _row_exists in table" error occurring during lightweight delete mutation on a table with Object column. [#49737](https://github.com/ClickHouse/ClickHouse/pull/49737) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix msan issue in randomStringUTF8(uneven number) [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix aggregate function kolmogorovSmirnovTest [#49768](https://github.com/ClickHouse/ClickHouse/pull/49768) ([FFFFFFFHHHHHHH](https://github.com/FFFFFFFHHHHHHH)).
+* Fix settings aliases in native protocol [#49776](https://github.com/ClickHouse/ClickHouse/pull/49776) ([Azat Khuzhin](https://github.com/azat)).
+* Fix `arrayMap` with array of tuples with single argument [#49789](https://github.com/ClickHouse/ClickHouse/pull/49789) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix per-query IO/BACKUPs throttling settings [#49797](https://github.com/ClickHouse/ClickHouse/pull/49797) ([Azat Khuzhin](https://github.com/azat)).
+* Fix setting NULL in profile definition [#49831](https://github.com/ClickHouse/ClickHouse/pull/49831) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix a bug with projections and the aggregate_functions_null_for_empty setting (for query_plan_optimize_projection) [#49873](https://github.com/ClickHouse/ClickHouse/pull/49873) ([Amos Bird](https://github.com/amosbird)).
+* Fix processing pending batch for Distributed async INSERT after restart [#49884](https://github.com/ClickHouse/ClickHouse/pull/49884) ([Azat Khuzhin](https://github.com/azat)).
+* Fix assertion in CacheMetadata::doCleanup [#49914](https://github.com/ClickHouse/ClickHouse/pull/49914) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix `is_prefix` in OptimizeRegularExpression [#49919](https://github.com/ClickHouse/ClickHouse/pull/49919) ([Han Fei](https://github.com/hanfei1991)).
+* Fix metrics `WriteBufferFromS3Bytes`, `WriteBufferFromS3Microseconds` and `WriteBufferFromS3RequestsErrors` [#49930](https://github.com/ClickHouse/ClickHouse/pull/49930) ([Aleksandr Musorin](https://github.com/AVMusorin)).
+* Fix IPv6 encoding in protobuf [#49933](https://github.com/ClickHouse/ClickHouse/pull/49933) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix possible Logical error on bad Nullable parsing for text formats [#49960](https://github.com/ClickHouse/ClickHouse/pull/49960) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add setting `output_format_parquet_compliant_nested_types` to produce more compatible Parquet files [#50001](https://github.com/ClickHouse/ClickHouse/pull/50001) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix logical error in stress test "Not enough space to add ..." [#50021](https://github.com/ClickHouse/ClickHouse/pull/50021) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Avoid deadlock when starting table in attach thread of `ReplicatedMergeTree` [#50026](https://github.com/ClickHouse/ClickHouse/pull/50026) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix assert in SpanHolder::finish() with fibers attempt 2 [#50034](https://github.com/ClickHouse/ClickHouse/pull/50034) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add proper escaping for DDL OpenTelemetry context serialization [#50045](https://github.com/ClickHouse/ClickHouse/pull/50045) ([Azat Khuzhin](https://github.com/azat)).
+* Fix reporting broken projection parts [#50052](https://github.com/ClickHouse/ClickHouse/pull/50052) ([Amos Bird](https://github.com/amosbird)).
+* JIT compilation not equals NaN fix [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crashing in case of Replicated database without arguments [#50058](https://github.com/ClickHouse/ClickHouse/pull/50058) ([Azat Khuzhin](https://github.com/azat)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix invalid index analysis for date related keys [#50153](https://github.com/ClickHouse/ClickHouse/pull/50153) ([Amos Bird](https://github.com/amosbird)).
+* Do not allow MODIFY ORDER BY when there are no ORDER BY columns [#50154](https://github.com/ClickHouse/ClickHouse/pull/50154) ([Han Fei](https://github.com/hanfei1991)).
+* Fix broken index analysis when binary operator contains a null constant argument [#50177](https://github.com/ClickHouse/ClickHouse/pull/50177) ([Amos Bird](https://github.com/amosbird)).
+* clickhouse-client: disallow usage of `--query` and `--queries-file` at the same time [#50210](https://github.com/ClickHouse/ClickHouse/pull/50210) ([Alexey Gerasimchuk](https://github.com/Demilivor)).
+* Fix UB for INTO OUTFILE extensions (APPEND / AND STDOUT) and WATCH EVENTS [#50216](https://github.com/ClickHouse/ClickHouse/pull/50216) ([Azat Khuzhin](https://github.com/azat)).
+* Fix skipping spaces at end of row in CustomSeparatedIgnoreSpaces format [#50224](https://github.com/ClickHouse/ClickHouse/pull/50224) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix iceberg metadata parsing [#50232](https://github.com/ClickHouse/ClickHouse/pull/50232) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix nested distributed SELECT in WITH clause [#50234](https://github.com/ClickHouse/ClickHouse/pull/50234) ([Azat Khuzhin](https://github.com/azat)).
+* Fix msan issue in keyed siphash [#50245](https://github.com/ClickHouse/ClickHouse/pull/50245) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix bugs in Poco sockets in non-blocking mode, use true non-blocking sockets [#50252](https://github.com/ClickHouse/ClickHouse/pull/50252) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix checksum calculation for backup entries [#50264](https://github.com/ClickHouse/ClickHouse/pull/50264) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Comparison functions NaN fix [#50287](https://github.com/ClickHouse/ClickHouse/pull/50287) ([Maksim Kita](https://github.com/kitaisreal)).
+* JIT aggregation nullable key fix [#50291](https://github.com/ClickHouse/ClickHouse/pull/50291) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix clickhouse-local crashing when writing empty Arrow or Parquet output [#50328](https://github.com/ClickHouse/ClickHouse/pull/50328) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix crash when Pool::Entry::disconnect() is called [#50334](https://github.com/ClickHouse/ClickHouse/pull/50334) ([Val Doroshchuk](https://github.com/valbok)).
+* Improved fetch part by holding directory lock longer [#50339](https://github.com/ClickHouse/ClickHouse/pull/50339) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix bitShift* functions with both constant arguments [#50343](https://github.com/ClickHouse/ClickHouse/pull/50343) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+* Fix hashing of const integer values [#50421](https://github.com/ClickHouse/ClickHouse/pull/50421) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix merge_tree_min_rows_for_seek/merge_tree_min_bytes_for_seek for data skipping indexes [#50432](https://github.com/ClickHouse/ClickHouse/pull/50432) ([Azat Khuzhin](https://github.com/azat)).
+* Limit the number of in-flight tasks for loading outdated parts [#50450](https://github.com/ClickHouse/ClickHouse/pull/50450) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Keeper fix: apply uncommitted state after snapshot install [#50483](https://github.com/ClickHouse/ClickHouse/pull/50483) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix incorrect constant folding [#50536](https://github.com/ClickHouse/ClickHouse/pull/50536) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix logical error in stress test (Not enough space to add ...) [#50583](https://github.com/ClickHouse/ClickHouse/pull/50583) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix converting Null to LowCardinality(Nullable) in values table function [#50637](https://github.com/ClickHouse/ClickHouse/pull/50637) ([Kruglov Pavel](https://github.com/Avogar)).
+* Revert invalid RegExpTreeDictionary optimization [#50642](https://github.com/ClickHouse/ClickHouse/pull/50642) ([Johann Gan](https://github.com/johanngan)).
+
### ClickHouse release 23.4, 2023-04-26
#### Backward Incompatible Change
diff --git a/README.md b/README.md
index 9561458ba37..1036e1a97e1 100644
--- a/README.md
+++ b/README.md
@@ -16,18 +16,21 @@ curl https://clickhouse.com/ | sh
* [YouTube channel](https://www.youtube.com/c/ClickHouseDB) has a lot of content about ClickHouse in video format.
* [Slack](https://clickhouse.com/slack) and [Telegram](https://telegram.me/clickhouse_en) allow chatting with ClickHouse users in real-time.
* [Blog](https://clickhouse.com/blog/) contains various ClickHouse-related articles, as well as announcements and reports about events.
-* [Code Browser (Woboq)](https://clickhouse.com/codebrowser/ClickHouse/index.html) with syntax highlight and navigation.
-* [Code Browser (github.dev)](https://github.dev/ClickHouse/ClickHouse) with syntax highlight, powered by github.dev.
+* [Code Browser (Woboq)](https://clickhouse.com/codebrowser/ClickHouse/index.html) with syntax highlighting and navigation.
+* [Code Browser (github.dev)](https://github.dev/ClickHouse/ClickHouse) with syntax highlighting, powered by github.dev.
+* [Static Analysis (SonarCloud)](https://sonarcloud.io/project/issues?resolved=false&id=ClickHouse_ClickHouse) proposes C++ quality improvements.
* [Contacts](https://clickhouse.com/company/contact) can help to get your questions answered if there are any.
## Upcoming Events
-* [**v23.5 Release Webinar**](https://clickhouse.com/company/events/v23-5-release-webinar?utm_source=github&utm_medium=social&utm_campaign=release-webinar-2023-05) - Jun 8 - 23.5 is rapidly approaching. Original creator, co-founder, and CTO of ClickHouse Alexey Milovidov will walk us through the highlights of the release.
-* [**ClickHouse Meetup in Bangalore**](https://www.meetup.com/clickhouse-bangalore-user-group/events/293740066/) - Jun 7
-* [**ClickHouse Meetup in San Francisco**](https://www.meetup.com/clickhouse-silicon-valley-meetup-group/events/293426725/) - Jun 7
+* [**v23.6 Release Webinar**](https://clickhouse.com/company/events/v23-6-release-call?utm_source=github&utm_medium=social&utm_campaign=release-webinar-2023-06) - Jun 29 - 23.6 is rapidly approaching. Original creator, co-founder, and CTO of ClickHouse Alexey Milovidov will walk us through the highlights of the release.
+* [**ClickHouse Meetup in Boston**](https://www.meetup.com/clickhouse-boston-user-group/events/293913596) - Jul 18
+* [**ClickHouse Meetup in NYC**](https://www.meetup.com/clickhouse-new-york-user-group/events/293913441) - Jul 19
+* [**ClickHouse Meetup in Toronto**](https://www.meetup.com/clickhouse-toronto-user-group/events/294183127) - Jul 20
+* [**ClickHouse Meetup in Singapore**](https://www.meetup.com/clickhouse-singapore-meetup-group/events/294428050/) - Jul 27
+* [**ClickHouse Meetup in Paris**](https://www.meetup.com/clickhouse-france-user-group/events/294283460) - Sep 12
-
-Also, keep an eye out for upcoming meetups in Amsterdam, Boston, NYC, Beijing, and Toronto. Somewhere else you want us to be? Please feel free to reach out to tyler clickhouse com.
+Also, keep an eye out for upcoming meetups around the world. Somewhere else you want us to be? Please feel free to reach out to tyler clickhouse com.
## Recent Recordings
* **Recent Meetup Videos**: [Meetup Playlist](https://www.youtube.com/playlist?list=PL0Z2YDlm0b3iNDUzpY1S3L_iV4nARda_U) Whenever possible, recordings of the ClickHouse Community Meetups are edited and presented as individual talks. Currently featuring "Modern SQL in 2023", "Fast, Concurrent, and Consistent Asynchronous INSERTS in ClickHouse", and "Full-Text Indices: Design and Experiments".
diff --git a/SECURITY.md b/SECURITY.md
index 75c1a9d7d6a..4ba5f13d09c 100644
--- a/SECURITY.md
+++ b/SECURITY.md
@@ -13,9 +13,11 @@ The following versions of ClickHouse server are currently being supported with s
| Version | Supported |
|:-|:-|
+| 23.6 | ✔️ |
+| 23.5 | ✔️ |
| 23.4 | ✔️ |
| 23.3 | ✔️ |
-| 23.2 | ✔️ |
+| 23.2 | ❌ |
| 23.1 | ❌ |
| 22.12 | ❌ |
| 22.11 | ❌ |
diff --git a/base/base/IPv4andIPv6.h b/base/base/IPv4andIPv6.h
index 7b745ec7b84..e2f93b54124 100644
--- a/base/base/IPv4andIPv6.h
+++ b/base/base/IPv4andIPv6.h
@@ -2,21 +2,23 @@
#include
#include
+#include
#include
namespace DB
{
-    using IPv4 = StrongTypedef<UInt32, struct IPv4Tag>;
+    struct IPv4 : StrongTypedef<UInt32, struct IPv4Tag>
+    {
+        using StrongTypedef::StrongTypedef;
+        using StrongTypedef::operator=;
+        constexpr explicit IPv4(UInt64 value): StrongTypedef(static_cast<UnderlyingType>(value)) {}
+    };
    struct IPv6 : StrongTypedef<UInt128, struct IPv6Tag>
{
- constexpr IPv6() = default;
- constexpr explicit IPv6(const UInt128 & x) : StrongTypedef(x) {}
- constexpr explicit IPv6(UInt128 && x) : StrongTypedef(std::move(x)) {}
-
- IPv6 & operator=(const UInt128 & rhs) { StrongTypedef::operator=(rhs); return *this; }
- IPv6 & operator=(UInt128 && rhs) { StrongTypedef::operator=(std::move(rhs)); return *this; }
+ using StrongTypedef::StrongTypedef;
+ using StrongTypedef::operator=;
bool operator<(const IPv6 & rhs) const
{
@@ -54,12 +56,22 @@ namespace DB
namespace std
{
+ /// For historical reasons we hash IPv6 as a FixedString(16)
template <>
    struct hash<DB::IPv6>
    {
        size_t operator()(const DB::IPv6 & x) const
        {
-            return std::hash<DB::UInt128>()(x.toUnderType());
+            return std::hash<std::string_view>{}(std::string_view(reinterpret_cast<const char *>(&x.toUnderType()), IPV6_BINARY_LENGTH));
+        }
+    };
+
+    template <>
+    struct hash<DB::IPv4>
+    {
+        size_t operator()(const DB::IPv4 & x) const
+        {
+            return std::hash<DB::UInt32>()(x.toUnderType());
}
};
}
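A standalone sketch of the convention noted above: hash the IPv6 address as its raw 16 bytes (the way a `FixedString(16)` value would be hashed), rather than as the underlying `UInt128`. The stand-in type below is illustrative, not the ClickHouse one:

```cpp
#include <array>
#include <cstddef>
#include <functional>
#include <string_view>

// Stand-in for DB::IPv6: the 16 raw bytes of an address.
using IPv6Bytes = std::array<unsigned char, 16>;

// Feed the raw bytes to std::hash<std::string_view>, mirroring the
// specialization above, so the hash matches FixedString(16) hashing.
std::size_t hashIPv6(const IPv6Bytes & addr)
{
    return std::hash<std::string_view>{}(
        std::string_view(reinterpret_cast<const char *>(addr.data()), addr.size()));
}
```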
diff --git a/base/base/bit_cast.h b/base/base/bit_cast.h
index 5373ead36e8..4783a84586b 100644
--- a/base/base/bit_cast.h
+++ b/base/base/bit_cast.h
@@ -7,7 +7,13 @@
/** Returns value `from` converted to type `To` while retaining bit representation.
* `To` and `From` must satisfy `CopyConstructible`.
+ *
* In contrast to std::bit_cast can cast types of different width.
+ *
+ * Note: for signed types of narrower size, the result is zero-extended
+ * instead of sign-extended, as it would be with a regular static_cast.
+ * For example, Int8 -1 (represented as 0xFF) bit_cast to UInt64
+ * gives 255 (represented as 0x00000000000000FF) instead of 0xFFFFFFFFFFFFFFFF.
*/
template <typename To, typename From>
std::decay_t<To> bit_cast(const From & from)
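A minimal sketch of the zero-extension behaviour described in the comment above, under the assumption of a little-endian target (the helper below is illustrative, not the actual implementation):

```cpp
#include <cassert>
#include <cstdint>
#include <cstring>

// Copy the bytes of a narrower value into a wider zero-initialized target.
// The unset high bytes stay zero, so signed values are zero-extended rather
// than sign-extended (little-endian layout assumed).
template <typename To, typename From>
To widening_bit_cast(const From & from)
{
    static_assert(sizeof(To) >= sizeof(From));
    To to{};
    std::memcpy(&to, &from, sizeof(From));
    return to;
}

int main()
{
    int8_t x = -1;  // stored as 0xFF
    assert(widening_bit_cast<uint64_t>(x) == 255);  // not 0xFFFFFFFFFFFFFFFF
}
```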
diff --git a/base/base/find_symbols.h b/base/base/find_symbols.h
index a8747ecc9b7..83232669c04 100644
--- a/base/base/find_symbols.h
+++ b/base/base/find_symbols.h
@@ -2,6 +2,7 @@
#include
#include
+#include
#if defined(__SSE2__)
#include
diff --git a/base/base/hex.h b/base/base/hex.h
index b8cf95db893..937218fec5a 100644
--- a/base/base/hex.h
+++ b/base/base/hex.h
@@ -4,212 +4,288 @@
#include
#include "types.h"
-/// Maps 0..15 to 0..9A..F or 0..9a..f correspondingly.
+namespace CityHash_v1_0_2 { struct uint128; }
-constexpr inline std::string_view hex_digit_to_char_uppercase_table = "0123456789ABCDEF";
-constexpr inline std::string_view hex_digit_to_char_lowercase_table = "0123456789abcdef";
+namespace wide
+{
+    template <size_t Bits, typename Signature>
+    class integer;
+}
+
+namespace impl
+{
+ /// Maps 0..15 to 0..9A..F or 0..9a..f correspondingly.
+ constexpr inline std::string_view hex_digit_to_char_uppercase_table = "0123456789ABCDEF";
+ constexpr inline std::string_view hex_digit_to_char_lowercase_table = "0123456789abcdef";
+
+ /// Maps 0..255 to 00..FF or 00..ff correspondingly.
+ constexpr inline std::string_view hex_byte_to_char_uppercase_table = //
+ "000102030405060708090A0B0C0D0E0F"
+ "101112131415161718191A1B1C1D1E1F"
+ "202122232425262728292A2B2C2D2E2F"
+ "303132333435363738393A3B3C3D3E3F"
+ "404142434445464748494A4B4C4D4E4F"
+ "505152535455565758595A5B5C5D5E5F"
+ "606162636465666768696A6B6C6D6E6F"
+ "707172737475767778797A7B7C7D7E7F"
+ "808182838485868788898A8B8C8D8E8F"
+ "909192939495969798999A9B9C9D9E9F"
+ "A0A1A2A3A4A5A6A7A8A9AAABACADAEAF"
+ "B0B1B2B3B4B5B6B7B8B9BABBBCBDBEBF"
+ "C0C1C2C3C4C5C6C7C8C9CACBCCCDCECF"
+ "D0D1D2D3D4D5D6D7D8D9DADBDCDDDEDF"
+ "E0E1E2E3E4E5E6E7E8E9EAEBECEDEEEF"
+ "F0F1F2F3F4F5F6F7F8F9FAFBFCFDFEFF";
+
+ constexpr inline std::string_view hex_byte_to_char_lowercase_table = //
+ "000102030405060708090a0b0c0d0e0f"
+ "101112131415161718191a1b1c1d1e1f"
+ "202122232425262728292a2b2c2d2e2f"
+ "303132333435363738393a3b3c3d3e3f"
+ "404142434445464748494a4b4c4d4e4f"
+ "505152535455565758595a5b5c5d5e5f"
+ "606162636465666768696a6b6c6d6e6f"
+ "707172737475767778797a7b7c7d7e7f"
+ "808182838485868788898a8b8c8d8e8f"
+ "909192939495969798999a9b9c9d9e9f"
+ "a0a1a2a3a4a5a6a7a8a9aaabacadaeaf"
+ "b0b1b2b3b4b5b6b7b8b9babbbcbdbebf"
+ "c0c1c2c3c4c5c6c7c8c9cacbcccdcecf"
+ "d0d1d2d3d4d5d6d7d8d9dadbdcdddedf"
+ "e0e1e2e3e4e5e6e7e8e9eaebecedeeef"
+ "f0f1f2f3f4f5f6f7f8f9fafbfcfdfeff";
+
+ /// Maps 0..255 to 00000000..11111111 correspondingly.
+ constexpr inline std::string_view bin_byte_to_char_table = //
+ "0000000000000001000000100000001100000100000001010000011000000111"
+ "0000100000001001000010100000101100001100000011010000111000001111"
+ "0001000000010001000100100001001100010100000101010001011000010111"
+ "0001100000011001000110100001101100011100000111010001111000011111"
+ "0010000000100001001000100010001100100100001001010010011000100111"
+ "0010100000101001001010100010101100101100001011010010111000101111"
+ "0011000000110001001100100011001100110100001101010011011000110111"
+ "0011100000111001001110100011101100111100001111010011111000111111"
+ "0100000001000001010000100100001101000100010001010100011001000111"
+ "0100100001001001010010100100101101001100010011010100111001001111"
+ "0101000001010001010100100101001101010100010101010101011001010111"
+ "0101100001011001010110100101101101011100010111010101111001011111"
+ "0110000001100001011000100110001101100100011001010110011001100111"
+ "0110100001101001011010100110101101101100011011010110111001101111"
+ "0111000001110001011100100111001101110100011101010111011001110111"
+ "0111100001111001011110100111101101111100011111010111111001111111"
+ "1000000010000001100000101000001110000100100001011000011010000111"
+ "1000100010001001100010101000101110001100100011011000111010001111"
+ "1001000010010001100100101001001110010100100101011001011010010111"
+ "1001100010011001100110101001101110011100100111011001111010011111"
+ "1010000010100001101000101010001110100100101001011010011010100111"
+ "1010100010101001101010101010101110101100101011011010111010101111"
+ "1011000010110001101100101011001110110100101101011011011010110111"
+ "1011100010111001101110101011101110111100101111011011111010111111"
+ "1100000011000001110000101100001111000100110001011100011011000111"
+ "1100100011001001110010101100101111001100110011011100111011001111"
+ "1101000011010001110100101101001111010100110101011101011011010111"
+ "1101100011011001110110101101101111011100110111011101111011011111"
+ "1110000011100001111000101110001111100100111001011110011011100111"
+ "1110100011101001111010101110101111101100111011011110111011101111"
+ "1111000011110001111100101111001111110100111101011111011011110111"
+ "1111100011111001111110101111101111111100111111011111111011111111";
+
+ /// Maps 0..9, A..F, a..f to 0..15. Other chars are mapped to implementation specific value.
+ constexpr inline std::string_view hex_char_to_digit_table
+ = {"\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\xff\xff\xff\xff\xff\xff" //0-9
+ "\xff\x0a\x0b\x0c\x0d\x0e\x0f\xff\xff\xff\xff\xff\xff\xff\xff\xff" //A-Z
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\x0a\x0b\x0c\x0d\x0e\x0f\xff\xff\xff\xff\xff\xff\xff\xff\xff" //a-z
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
+ "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff",
+ 256};
+
+ /// Converts a hex digit '0'..'f' or '0'..'F' to its value 0..15.
+ constexpr UInt8 unhexDigit(char c)
+ {
+        return hex_char_to_digit_table[static_cast<size_t>(c)];
+ }
+
+ /// Converts an unsigned integer in the native endian to hexadecimal representation and back. Used as a base class for HexConversion.
+    template <typename TUInt>
+ struct HexConversionUInt
+ {
+ static const constexpr size_t num_hex_digits = sizeof(TUInt) * 2;
+
+ static void hex(TUInt uint_, char * out, std::string_view table)
+ {
+ union
+ {
+ TUInt value;
+ UInt8 uint8[sizeof(TUInt)];
+ };
+
+ value = uint_;
+
+ for (size_t i = 0; i < sizeof(TUInt); ++i)
+ {
+ if constexpr (std::endian::native == std::endian::little)
+                memcpy(out + i * 2, &table[static_cast<size_t>(uint8[sizeof(TUInt) - 1 - i]) * 2], 2);
+            else
+                memcpy(out + i * 2, &table[static_cast<size_t>(uint8[i]) * 2], 2);
+ }
+ }
+
+ static TUInt unhex(const char * data)
+ {
+ TUInt res;
+ if constexpr (sizeof(TUInt) == 1)
+ {
+                res = static_cast<UInt8>(unhexDigit(data[0])) * 0x10 + static_cast<UInt8>(unhexDigit(data[1]));
+ }
+ else if constexpr (sizeof(TUInt) == 2)
+ {
+                res = static_cast<UInt16>(unhexDigit(data[0])) * 0x1000 + static_cast<UInt16>(unhexDigit(data[1])) * 0x100
+                    + static_cast<UInt16>(unhexDigit(data[2])) * 0x10 + static_cast<UInt16>(unhexDigit(data[3]));
+ }
+ else if constexpr ((sizeof(TUInt) <= 8) || ((sizeof(TUInt) % 8) != 0))
+ {
+ res = 0;
+ for (size_t i = 0; i < sizeof(TUInt) * 2; ++i, ++data)
+ {
+ res <<= 4;
+ res += unhexDigit(*data);
+ }
+ }
+ else
+ {
+ res = 0;
+ for (size_t i = 0; i < sizeof(TUInt) / 8; ++i, data += 16)
+ {
+ res <<= 64;
+                    res += HexConversionUInt<UInt64>::unhex(data);
+ }
+ }
+ return res;
+ }
+ };
+
+ /// Helper template class to convert a value of any supported type to hexadecimal representation and back.
+    template <typename T, typename SFINAE = void>
+    struct HexConversion;
+
+    template <typename TUInt>
+    struct HexConversion<TUInt, std::enable_if_t<std::is_integral_v<TUInt>>> : public HexConversionUInt<TUInt> {};
+
+    template <size_t Bits, typename Signature>
+    struct HexConversion<wide::integer<Bits, Signature>> : public HexConversionUInt<wide::integer<Bits, Signature>> {};
+
+    template <typename CityHashUInt128> /// Partial specialization here allows not to include <city.h> in this header.
+    struct HexConversion<CityHashUInt128, std::enable_if_t<std::is_same_v<CityHashUInt128, CityHash_v1_0_2::uint128>>>
+ {
+ static const constexpr size_t num_hex_digits = 32;
+
+ static void hex(const CityHashUInt128 & uint_, char * out, std::string_view table)
+ {
+            HexConversion<UInt64>::hex(uint_.high64, out, table);
+            HexConversion<UInt64>::hex(uint_.low64, out + 16, table);
+ }
+
+ static CityHashUInt128 unhex(const char * data)
+ {
+ CityHashUInt128 res;
+            res.high64 = HexConversion<UInt64>::unhex(data);
+            res.low64 = HexConversion<UInt64>::unhex(data + 16);
+ return res;
+ }
+ };
+}
+
+/// Produces a hexadecimal representation of an integer value with leading zeros (for checksums).
+/// The function supports native integer types, wide::integer, CityHash_v1_0_2::uint128.
+/// It can be used with signed types as well, however they are written as corresponding unsigned numbers
+/// using two's complement (i.e. for example "-1" is written as "0xFF", not as "-0x01").
+template <typename T>
+void writeHexUIntUppercase(const T & value, char * out)
+{
+    impl::HexConversion<T>::hex(value, out, impl::hex_byte_to_char_uppercase_table);
+}
+
+template <typename T>
+void writeHexUIntLowercase(const T & value, char * out)
+{
+    impl::HexConversion<T>::hex(value, out, impl::hex_byte_to_char_lowercase_table);
+}
+
+template <typename T>
+std::string getHexUIntUppercase(const T & value)
+{
+    std::string res(impl::HexConversion<T>::num_hex_digits, '\0');
+ writeHexUIntUppercase(value, res.data());
+ return res;
+}
+
+template <typename T>
+std::string getHexUIntLowercase(const T & value)
+{
+    std::string res(impl::HexConversion<T>::num_hex_digits, '\0');
+ writeHexUIntLowercase(value, res.data());
+ return res;
+}
constexpr char hexDigitUppercase(unsigned char c)
{
- return hex_digit_to_char_uppercase_table[c];
+ return impl::hex_digit_to_char_uppercase_table[c];
}
+
constexpr char hexDigitLowercase(unsigned char c)
{
- return hex_digit_to_char_lowercase_table[c];
+ return impl::hex_digit_to_char_lowercase_table[c];
}
-/// Maps 0..255 to 00..FF or 00..ff correspondingly
-
-constexpr inline std::string_view hex_byte_to_char_uppercase_table = //
- "000102030405060708090A0B0C0D0E0F"
- "101112131415161718191A1B1C1D1E1F"
- "202122232425262728292A2B2C2D2E2F"
- "303132333435363738393A3B3C3D3E3F"
- "404142434445464748494A4B4C4D4E4F"
- "505152535455565758595A5B5C5D5E5F"
- "606162636465666768696A6B6C6D6E6F"
- "707172737475767778797A7B7C7D7E7F"
- "808182838485868788898A8B8C8D8E8F"
- "909192939495969798999A9B9C9D9E9F"
- "A0A1A2A3A4A5A6A7A8A9AAABACADAEAF"
- "B0B1B2B3B4B5B6B7B8B9BABBBCBDBEBF"
- "C0C1C2C3C4C5C6C7C8C9CACBCCCDCECF"
- "D0D1D2D3D4D5D6D7D8D9DADBDCDDDEDF"
- "E0E1E2E3E4E5E6E7E8E9EAEBECEDEEEF"
- "F0F1F2F3F4F5F6F7F8F9FAFBFCFDFEFF";
-
-constexpr inline std::string_view hex_byte_to_char_lowercase_table = //
- "000102030405060708090a0b0c0d0e0f"
- "101112131415161718191a1b1c1d1e1f"
- "202122232425262728292a2b2c2d2e2f"
- "303132333435363738393a3b3c3d3e3f"
- "404142434445464748494a4b4c4d4e4f"
- "505152535455565758595a5b5c5d5e5f"
- "606162636465666768696a6b6c6d6e6f"
- "707172737475767778797a7b7c7d7e7f"
- "808182838485868788898a8b8c8d8e8f"
- "909192939495969798999a9b9c9d9e9f"
- "a0a1a2a3a4a5a6a7a8a9aaabacadaeaf"
- "b0b1b2b3b4b5b6b7b8b9babbbcbdbebf"
- "c0c1c2c3c4c5c6c7c8c9cacbcccdcecf"
- "d0d1d2d3d4d5d6d7d8d9dadbdcdddedf"
- "e0e1e2e3e4e5e6e7e8e9eaebecedeeef"
- "f0f1f2f3f4f5f6f7f8f9fafbfcfdfeff";
-
inline void writeHexByteUppercase(UInt8 byte, void * out)
{
-    memcpy(out, &hex_byte_to_char_uppercase_table[static_cast<size_t>(byte) * 2], 2);
+    memcpy(out, &impl::hex_byte_to_char_uppercase_table[static_cast<size_t>(byte) * 2], 2);
}
inline void writeHexByteLowercase(UInt8 byte, void * out)
{
-    memcpy(out, &hex_byte_to_char_lowercase_table[static_cast<size_t>(byte) * 2], 2);
+    memcpy(out, &impl::hex_byte_to_char_lowercase_table[static_cast<size_t>(byte) * 2], 2);
}
-constexpr inline std::string_view bin_byte_to_char_table = //
- "0000000000000001000000100000001100000100000001010000011000000111"
- "0000100000001001000010100000101100001100000011010000111000001111"
- "0001000000010001000100100001001100010100000101010001011000010111"
- "0001100000011001000110100001101100011100000111010001111000011111"
- "0010000000100001001000100010001100100100001001010010011000100111"
- "0010100000101001001010100010101100101100001011010010111000101111"
- "0011000000110001001100100011001100110100001101010011011000110111"
- "0011100000111001001110100011101100111100001111010011111000111111"
- "0100000001000001010000100100001101000100010001010100011001000111"
- "0100100001001001010010100100101101001100010011010100111001001111"
- "0101000001010001010100100101001101010100010101010101011001010111"
- "0101100001011001010110100101101101011100010111010101111001011111"
- "0110000001100001011000100110001101100100011001010110011001100111"
- "0110100001101001011010100110101101101100011011010110111001101111"
- "0111000001110001011100100111001101110100011101010111011001110111"
- "0111100001111001011110100111101101111100011111010111111001111111"
- "1000000010000001100000101000001110000100100001011000011010000111"
- "1000100010001001100010101000101110001100100011011000111010001111"
- "1001000010010001100100101001001110010100100101011001011010010111"
- "1001100010011001100110101001101110011100100111011001111010011111"
- "1010000010100001101000101010001110100100101001011010011010100111"
- "1010100010101001101010101010101110101100101011011010111010101111"
- "1011000010110001101100101011001110110100101101011011011010110111"
- "1011100010111001101110101011101110111100101111011011111010111111"
- "1100000011000001110000101100001111000100110001011100011011000111"
- "1100100011001001110010101100101111001100110011011100111011001111"
- "1101000011010001110100101101001111010100110101011101011011010111"
- "1101100011011001110110101101101111011100110111011101111011011111"
- "1110000011100001111000101110001111100100111001011110011011100111"
- "1110100011101001111010101110101111101100111011011110111011101111"
- "1111000011110001111100101111001111110100111101011111011011110111"
- "1111100011111001111110101111101111111100111111011111111011111111";
-
-inline void writeBinByte(UInt8 byte, void * out)
+/// Converts a hex representation with leading zeros back to an integer value.
+/// The function supports native integer types, wide::integer, CityHash_v1_0_2::uint128.
+template <typename T>
+constexpr T unhexUInt(const char * data)
{
-    memcpy(out, &bin_byte_to_char_table[static_cast<size_t>(byte) * 8], 8);
+    return impl::HexConversion<T>::unhex(data);
}
-/// Produces hex representation of an unsigned int with leading zeros (for checksums)
-template <typename TUInt>
-inline void writeHexUIntImpl(TUInt uint_, char * out, std::string_view table)
-{
- union
- {
- TUInt value;
- UInt8 uint8[sizeof(TUInt)];
- };
-
- value = uint_;
-
- for (size_t i = 0; i < sizeof(TUInt); ++i)
- {
- if constexpr (std::endian::native == std::endian::little)
-            memcpy(out + i * 2, &table[static_cast<size_t>(uint8[sizeof(TUInt) - 1 - i]) * 2], 2);
-        else
-            memcpy(out + i * 2, &table[static_cast<size_t>(uint8[i]) * 2], 2);
- }
-}
-
-template <typename TUInt>
-inline void writeHexUIntUppercase(TUInt uint_, char * out)
-{
- writeHexUIntImpl(uint_, out, hex_byte_to_char_uppercase_table);
-}
-
-template <typename TUInt>
-inline void writeHexUIntLowercase(TUInt uint_, char * out)
-{
- writeHexUIntImpl(uint_, out, hex_byte_to_char_lowercase_table);
-}
-
-template <typename TUInt>
-std::string getHexUIntUppercase(TUInt uint_)
-{
- std::string res(sizeof(TUInt) * 2, '\0');
- writeHexUIntUppercase(uint_, res.data());
- return res;
-}
-
-template <typename TUInt>
-std::string getHexUIntLowercase(TUInt uint_)
-{
- std::string res(sizeof(TUInt) * 2, '\0');
- writeHexUIntLowercase(uint_, res.data());
- return res;
-}
-
-/// Maps 0..9, A..F, a..f to 0..15. Other chars are mapped to implementation specific value.
-
-constexpr inline std::string_view hex_char_to_digit_table
- = {"\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\xff\xff\xff\xff\xff\xff" //0-9
- "\xff\x0a\x0b\x0c\x0d\x0e\x0f\xff\xff\xff\xff\xff\xff\xff\xff\xff" //A-Z
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\x0a\x0b\x0c\x0d\x0e\x0f\xff\xff\xff\xff\xff\xff\xff\xff\xff" //a-z
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff"
- "\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff",
- 256};
-
+/// Converts a hexadecimal digit '0'..'f' or '0'..'F' to UInt8.
constexpr UInt8 unhex(char c)
{
-    return hex_char_to_digit_table[static_cast<size_t>(c)];
+ return impl::unhexDigit(c);
}
+/// Converts two hexadecimal digits to UInt8.
constexpr UInt8 unhex2(const char * data)
{
-    return static_cast<UInt8>(unhex(data[0])) * 0x10 + static_cast<UInt8>(unhex(data[1]));
+    return unhexUInt<UInt8>(data);
}
+/// Converts four hexadecimal digits to UInt16.
constexpr UInt16 unhex4(const char * data)
{
-    return static_cast<UInt16>(unhex(data[0])) * 0x1000 + static_cast<UInt16>(unhex(data[1])) * 0x100
-        + static_cast<UInt16>(unhex(data[2])) * 0x10 + static_cast<UInt16>(unhex(data[3]));
+    return unhexUInt<UInt16>(data);
}
-template <typename TUInt>
-constexpr TUInt unhexUInt(const char * data)
+/// Produces a binary representation of a single byte.
+inline void writeBinByte(UInt8 byte, void * out)
{
- TUInt res = 0;
- if constexpr ((sizeof(TUInt) <= 8) || ((sizeof(TUInt) % 8) != 0))
- {
- for (size_t i = 0; i < sizeof(TUInt) * 2; ++i, ++data)
- {
- res <<= 4;
- res += unhex(*data);
- }
- }
- else
- {
- for (size_t i = 0; i < sizeof(TUInt) / 8; ++i, data += 16)
- {
- res <<= 64;
-            res += unhexUInt<UInt64>(data);
- }
- }
- return res;
+    memcpy(out, &impl::bin_byte_to_char_table[static_cast<size_t>(byte) * 8], 8);
}
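To make the refactored interface concrete, a brief usage sketch of the public helpers defined above (assuming the header's usual `<base/hex.h>` include path and ClickHouse's `UInt16` alias):

```cpp
#include <base/hex.h>
#include <cassert>
#include <string>

int main()
{
    // Hex with leading zeros, as used for checksums.
    assert(getHexUIntUppercase(UInt16{0x00AB}) == "00AB");
    assert(getHexUIntLowercase(UInt16{0x00AB}) == "00ab");

    // unhexUInt is the inverse for the same fixed width.
    assert(unhexUInt<UInt16>("00AB") == 0x00AB);
    assert(unhex('F') == 15);
    assert(unhex2("FF") == 0xFF);
}
```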
diff --git a/base/base/interpolate.h b/base/base/interpolate.h
index 1d4fc0b6257..4c27f70c95b 100644
--- a/base/base/interpolate.h
+++ b/base/base/interpolate.h
@@ -11,3 +11,8 @@ constexpr double interpolateExponential(double min, double max, double ratio)
assert(min > 0 && ratio >= 0 && ratio <= 1);
return min * std::pow(max / min, ratio);
}
+
+constexpr double interpolateLinear(double min, double max, double ratio)
+{
+ return std::lerp(min, max, ratio);
+}
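A quick usage sketch of the helper added above; since it forwards to `std::lerp`, the endpoints are reproduced exactly (assuming the usual `<base/interpolate.h>` include path):

```cpp
#include <base/interpolate.h>
#include <cassert>

int main()
{
    assert(interpolateLinear(10.0, 20.0, 0.0) == 10.0);
    assert(interpolateLinear(10.0, 20.0, 0.5) == 15.0);  // midpoint
    assert(interpolateLinear(10.0, 20.0, 1.0) == 20.0);
}
```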
diff --git a/base/base/wide_integer_impl.h b/base/base/wide_integer_impl.h
index 4a80c176829..411841e6d9f 100644
--- a/base/base/wide_integer_impl.h
+++ b/base/base/wide_integer_impl.h
@@ -27,6 +27,8 @@ using FromDoubleIntermediateType = long double;
using FromDoubleIntermediateType = boost::multiprecision::cpp_bin_float_double_extended;
#endif
+namespace CityHash_v1_0_2 { struct uint128; }
+
namespace wide
{
@@ -281,6 +283,17 @@ struct integer<Bits, Signed>::_impl
}
}
+    template <typename CityHashUInt128>
+    constexpr static void wide_integer_from_cityhash_uint128(integer<Bits, Signed> & self, const CityHashUInt128 & value) noexcept
+ {
+ static_assert(sizeof(item_count) >= 2);
+
+ if constexpr (std::endian::native == std::endian::little)
+ wide_integer_from_tuple_like(self, std::make_pair(value.low64, value.high64));
+ else
+ wide_integer_from_tuple_like(self, std::make_pair(value.high64, value.low64));
+ }
+
/**
* N.B. t is constructed from double, so max(t) = max(double) ~ 2^310
* the recursive call happens when t / 2^64 > 2^64, so there won't be more than 5 of them.
@@ -1036,6 +1049,8 @@ constexpr integer<Bits, Signed>::integer(T rhs) noexcept
_impl::wide_integer_from_wide_integer(*this, rhs);
    else if constexpr (IsTupleLike<T>::value)
        _impl::wide_integer_from_tuple_like(*this, rhs);
+    else if constexpr (std::is_same_v<std::decay_t<T>, CityHash_v1_0_2::uint128>)
+ _impl::wide_integer_from_cityhash_uint128(*this, rhs);
else
_impl::wide_integer_from_builtin(*this, rhs);
}
@@ -1051,6 +1066,8 @@ constexpr integer::integer(std::initializer_list il) noexcept
_impl::wide_integer_from_wide_integer(*this, *il.begin());
    else if constexpr (IsTupleLike<T>::value)
        _impl::wide_integer_from_tuple_like(*this, *il.begin());
+    else if constexpr (std::is_same_v<std::decay_t<T>, CityHash_v1_0_2::uint128>)
+ _impl::wide_integer_from_cityhash_uint128(*this, *il.begin());
else
_impl::wide_integer_from_builtin(*this, *il.begin());
}
@@ -1088,6 +1105,8 @@ constexpr integer<Bits, Signed> & integer<Bits, Signed>::operator=(T rhs) noexcept
{
    if constexpr (IsTupleLike<T>::value)
        _impl::wide_integer_from_tuple_like(*this, rhs);
+    else if constexpr (std::is_same_v<std::decay_t<T>, CityHash_v1_0_2::uint128>)
+ _impl::wide_integer_from_cityhash_uint128(*this, rhs);
else
_impl::wide_integer_from_builtin(*this, rhs);
return *this;
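The conversion added above packs CityHash's `(low64, high64)` pair into the wide integer's 64-bit items, low item first on little-endian targets (and swapped on big-endian). A standalone sketch of that packing, with illustrative stand-in types rather than the real `wide::integer`:

```cpp
#include <cstdint>

// Stand-ins: a 128-bit value as two 64-bit items (item 0 = least significant)
// and CityHash's uint128 as a (low64, high64) pair.
struct UInt128Items { uint64_t items[2]; };
struct CityHash128  { uint64_t low64; uint64_t high64; };

UInt128Items fromCityHash(const CityHash128 & v)
{
    // Little-endian item order; a big-endian target would swap the pair.
    return {{v.low64, v.high64}};
}
```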
diff --git a/base/poco/Foundation/CMakeLists.txt b/base/poco/Foundation/CMakeLists.txt
index 358f49ed055..d0dde8a51a5 100644
--- a/base/poco/Foundation/CMakeLists.txt
+++ b/base/poco/Foundation/CMakeLists.txt
@@ -87,7 +87,6 @@ set (SRCS
src/LoggingRegistry.cpp
src/LogStream.cpp
src/MD5Engine.cpp
- src/MemoryPool.cpp
src/MemoryStream.cpp
src/Message.cpp
src/Mutex.cpp
diff --git a/base/poco/Foundation/include/Poco/BinaryReader.h b/base/poco/Foundation/include/Poco/BinaryReader.h
index 4042b507a2f..2b9bca29944 100644
--- a/base/poco/Foundation/include/Poco/BinaryReader.h
+++ b/base/poco/Foundation/include/Poco/BinaryReader.h
@@ -117,6 +117,9 @@ public:
void readRaw(char * buffer, std::streamsize length);
/// Reads length bytes of raw data into buffer.
+ void readCString(std::string& value);
+ /// Reads zero-terminated C-string into value.
+
void readBOM();
/// Reads a byte-order mark from the stream and configures
/// the reader for the encountered byte order.
diff --git a/base/poco/Foundation/include/Poco/BinaryWriter.h b/base/poco/Foundation/include/Poco/BinaryWriter.h
index aa280d4ccab..a35d76d84bc 100644
--- a/base/poco/Foundation/include/Poco/BinaryWriter.h
+++ b/base/poco/Foundation/include/Poco/BinaryWriter.h
@@ -56,6 +56,8 @@ public:
LITTLE_ENDIAN_BYTE_ORDER = 3 /// little-endian byte-order
};
+ static const std::streamsize DEFAULT_MAX_CSTR_LENGTH { 1024 };
+
BinaryWriter(std::ostream & ostr, StreamByteOrder byteOrder = NATIVE_BYTE_ORDER);
/// Creates the BinaryWriter.
@@ -131,6 +133,9 @@ public:
void writeRaw(const char * buffer, std::streamsize length);
/// Writes length raw bytes from the given buffer to the stream.
+ void writeCString(const char* cString, std::streamsize maxLength = DEFAULT_MAX_CSTR_LENGTH);
+ /// Writes zero-terminated C-string.
+
void writeBOM();
/// Writes a byte-order mark to the stream. A byte order mark is
/// a 16-bit integer with a value of 0xFEFF, written in host byte-order.
diff --git a/base/poco/Foundation/include/Poco/MemoryPool.h b/base/poco/Foundation/include/Poco/MemoryPool.h
deleted file mode 100644
index 9ab12081b5f..00000000000
--- a/base/poco/Foundation/include/Poco/MemoryPool.h
+++ /dev/null
@@ -1,116 +0,0 @@
-//
-// MemoryPool.h
-//
-// Library: Foundation
-// Package: Core
-// Module: MemoryPool
-//
-// Definition of the MemoryPool class.
-//
-// Copyright (c) 2005-2006, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#ifndef Foundation_MemoryPool_INCLUDED
-#define Foundation_MemoryPool_INCLUDED
-
-
-#include
-#include
-#include "Poco/Foundation.h"
-#include "Poco/Mutex.h"
-
-
-namespace Poco
-{
-
-
-class Foundation_API MemoryPool
-/// A simple pool for fixed-size memory blocks.
-///
-/// The main purpose of this class is to speed-up
-/// memory allocations, as well as to reduce memory
-/// fragmentation in situations where the same blocks
-/// are allocated all over again, such as in server
-/// applications.
-///
-/// All allocated blocks are retained for future use.
-/// A limit on the number of blocks can be specified.
-/// Blocks can be preallocated.
-{
-public:
- MemoryPool(std::size_t blockSize, int preAlloc = 0, int maxAlloc = 0);
- /// Creates a MemoryPool for blocks with the given blockSize.
- /// The number of blocks given in preAlloc are preallocated.
-
- ~MemoryPool();
-
- void * get();
- /// Returns a memory block. If there are no more blocks
- /// in the pool, a new block will be allocated.
- ///
- /// If maxAlloc blocks are already allocated, an
- /// OutOfMemoryException is thrown.
-
- void release(void * ptr);
- /// Releases a memory block and returns it to the pool.
-
- std::size_t blockSize() const;
- /// Returns the block size.
-
- int allocated() const;
- /// Returns the number of allocated blocks.
-
- int available() const;
- /// Returns the number of available blocks in the pool.
-
-private:
- MemoryPool();
- MemoryPool(const MemoryPool &);
- MemoryPool & operator=(const MemoryPool &);
-
- void clear();
-
- enum
- {
- BLOCK_RESERVE = 128
- };
-
-    typedef std::vector<char*> BlockVec;
-
- std::size_t _blockSize;
- int _maxAlloc;
- int _allocated;
- BlockVec _blocks;
- FastMutex _mutex;
-};
-
-
-//
-// inlines
-//
-inline std::size_t MemoryPool::blockSize() const
-{
- return _blockSize;
-}
-
-
-inline int MemoryPool::allocated() const
-{
- return _allocated;
-}
-
-
-inline int MemoryPool::available() const
-{
- return (int)_blocks.size();
-}
-
-
-} // namespace Poco
-
-
-#endif // Foundation_MemoryPool_INCLUDED
diff --git a/base/poco/Foundation/src/BinaryReader.cpp b/base/poco/Foundation/src/BinaryReader.cpp
index f2961e03966..37ec2bc9040 100644
--- a/base/poco/Foundation/src/BinaryReader.cpp
+++ b/base/poco/Foundation/src/BinaryReader.cpp
@@ -274,6 +274,31 @@ void BinaryReader::readRaw(char* buffer, std::streamsize length)
}
+void BinaryReader::readCString(std::string& value)
+{
+ value.clear();
+ if (!_istr.good())
+ {
+ return;
+ }
+ value.reserve(256);
+ while (true)
+ {
+ char c;
+ _istr.get(c);
+ if (!_istr.good())
+ {
+ break;
+ }
+ if (c == '\0')
+ {
+ break;
+ }
+ value += c;
+ }
+}
+
+
void BinaryReader::readBOM()
{
UInt16 bom;
diff --git a/base/poco/Foundation/src/BinaryWriter.cpp b/base/poco/Foundation/src/BinaryWriter.cpp
index 6db5ab7cb90..c3fcabc4374 100644
--- a/base/poco/Foundation/src/BinaryWriter.cpp
+++ b/base/poco/Foundation/src/BinaryWriter.cpp
@@ -271,7 +271,7 @@ BinaryWriter& BinaryWriter::operator << (const std::string& value)
BinaryWriter& BinaryWriter::operator << (const char* value)
{
poco_check_ptr (value);
-
+
if (_pTextConverter)
{
std::string converted;
@@ -332,6 +332,15 @@ void BinaryWriter::writeRaw(const char* buffer, std::streamsize length)
}
+void BinaryWriter::writeCString(const char* cString, std::streamsize maxLength)
+{
+ const std::size_t len = ::strnlen(cString, maxLength);
+ writeRaw(cString, len);
+ static const char zero = '\0';
+ _ostr.write(&zero, sizeof(zero));
+}
+
+
void BinaryWriter::writeBOM()
{
UInt16 value = 0xFEFF;
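A usage sketch for the C-string round trip introduced above, relying only on the methods this change adds:

```cpp
#include <sstream>
#include <string>
#include "Poco/BinaryReader.h"
#include "Poco/BinaryWriter.h"

int main()
{
    std::stringstream ss;

    Poco::BinaryWriter writer(ss);
    writer.writeCString("hello");  // writes the bytes plus a trailing '\0'

    Poco::BinaryReader reader(ss);
    std::string value;
    reader.readCString(value);     // consumes characters up to the '\0'
    // value == "hello"
}
```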
diff --git a/base/poco/Foundation/src/MemoryPool.cpp b/base/poco/Foundation/src/MemoryPool.cpp
deleted file mode 100644
index 01c477be525..00000000000
--- a/base/poco/Foundation/src/MemoryPool.cpp
+++ /dev/null
@@ -1,105 +0,0 @@
-//
-// MemoryPool.cpp
-//
-// Library: Foundation
-// Package: Core
-// Module: MemoryPool
-//
-// Copyright (c) 2005-2006, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#include "Poco/MemoryPool.h"
-#include "Poco/Exception.h"
-
-
-namespace Poco {
-
-
-MemoryPool::MemoryPool(std::size_t blockSize, int preAlloc, int maxAlloc):
- _blockSize(blockSize),
- _maxAlloc(maxAlloc),
- _allocated(preAlloc)
-{
- poco_assert (maxAlloc == 0 || maxAlloc >= preAlloc);
- poco_assert (preAlloc >= 0 && maxAlloc >= 0);
-
- int r = BLOCK_RESERVE;
- if (preAlloc > r)
- r = preAlloc;
- if (maxAlloc > 0 && maxAlloc < r)
- r = maxAlloc;
- _blocks.reserve(r);
-
- try
- {
- for (int i = 0; i < preAlloc; ++i)
- {
- _blocks.push_back(new char[_blockSize]);
- }
- }
- catch (...)
- {
- clear();
- throw;
- }
-}
-
-
-MemoryPool::~MemoryPool()
-{
- clear();
-}
-
-
-void MemoryPool::clear()
-{
- for (BlockVec::iterator it = _blocks.begin(); it != _blocks.end(); ++it)
- {
- delete [] *it;
- }
- _blocks.clear();
-}
-
-
-void* MemoryPool::get()
-{
- FastMutex::ScopedLock lock(_mutex);
-
- if (_blocks.empty())
- {
- if (_maxAlloc == 0 || _allocated < _maxAlloc)
- {
- ++_allocated;
- return new char[_blockSize];
- }
- else throw OutOfMemoryException("MemoryPool exhausted");
- }
- else
- {
- char* ptr = _blocks.back();
- _blocks.pop_back();
- return ptr;
- }
-}
-
-
-void MemoryPool::release(void* ptr)
-{
- FastMutex::ScopedLock lock(_mutex);
-
- try
- {
- _blocks.push_back(reinterpret_cast<char*>(ptr));
- }
- catch (...)
- {
- delete [] reinterpret_cast<char*>(ptr);
- }
-}
-
-
-} // namespace Poco
diff --git a/base/poco/MongoDB/CMakeLists.txt b/base/poco/MongoDB/CMakeLists.txt
index 8f5c6be2cae..bb6f90ed8f5 100644
--- a/base/poco/MongoDB/CMakeLists.txt
+++ b/base/poco/MongoDB/CMakeLists.txt
@@ -13,3 +13,4 @@ target_compile_options (_poco_mongodb
target_include_directories (_poco_mongodb SYSTEM PUBLIC "include")
target_link_libraries (_poco_mongodb PUBLIC Poco::Net)
+
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Array.h b/base/poco/MongoDB/include/Poco/MongoDB/Array.h
index 4ed9cdd87ee..8a30c785b2d 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Array.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Array.h
@@ -33,7 +33,7 @@ namespace MongoDB
/// This class represents a BSON Array.
{
public:
- typedef SharedPtr<Array> Ptr;
+ using Ptr = SharedPtr<Array>;
Array();
/// Creates an empty Array.
@@ -41,8 +41,31 @@ namespace MongoDB
virtual ~Array();
/// Destroys the Array.
+ // Document template functions available for backward compatibility
+ using Document::add;
+ using Document::get;
+
template <typename T>
- T get(int pos) const
+ Document & add(T value)
+ /// Creates an element with the name from the current pos and value and
+ /// adds it to the array document.
+ ///
+ /// The active document is returned to allow chaining of the add methods.
+ {
+ return Document::add(Poco::NumberFormatter::format(size()), value);
+ }
+
+ Document & add(const char * value)
+ /// Creates an element with a name from the current pos and value and
+ /// adds it to the array document.
+ ///
+ /// The active document is returned to allow chaining of the add methods.
+ {
+ return Document::add(Poco::NumberFormatter::format(size()), value);
+ }
+
+ template <typename T>
+ T get(std::size_t pos) const
/// Returns the element at the given index and tries to convert
/// it to the template type. If the element is not found, a
/// Poco::NotFoundException will be thrown. If the element cannot be
@@ -52,7 +75,7 @@ namespace MongoDB
}
template <typename T>
- T get(int pos, const T & deflt) const
+ T get(std::size_t pos, const T & deflt) const
/// Returns the element at the given index and tries to convert
/// it to the template type. If the element is not found, or
/// has the wrong type, the deflt argument will be returned.
@@ -60,12 +83,12 @@ namespace MongoDB
return Document::get<T>(Poco::NumberFormatter::format(pos), deflt);
}
- Element::Ptr get(int pos) const;
+ Element::Ptr get(std::size_t pos) const;
/// Returns the element at the given index.
/// An empty element will be returned if the element is not found.
template <typename T>
- bool isType(int pos) const
+ bool isType(std::size_t pos) const
/// Returns true if the type of the element equals the TypeId of ElementTrait,
/// otherwise false.
{
@@ -74,6 +97,9 @@ namespace MongoDB
std::string toString(int indent = 0) const;
/// Returns a string representation of the Array.
+
+ private:
+ friend void BSONReader::read<Array::Ptr>(Array::Ptr & to);
};
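The new Array::add() overloads name each element after the array's current size, so values land under the BSON-style keys "0", "1", "2", and so on. A short usage sketch (not part of the patch):

#include <iostream>
#include "Poco/MongoDB/Array.h"

int main()
{
    Poco::MongoDB::Array::Ptr arr = new Poco::MongoDB::Array();
    arr->add(Poco::Int32(1));   // stored under key "0"
    arr->add(Poco::Int32(2));   // stored under key "1"
    arr->add("three");          // const char* overload, key "2"

    std::cout << arr->get<Poco::Int32>(0) << '\n';                    // 1
    std::cout << arr->get<std::string>(2, std::string("?")) << '\n';  // three
    return 0;
}

Note that add() returns Document & rather than Array &, so chaining a second single-argument add() on the returned reference would resolve against Document's two-argument overloads and fail to compile; sequential calls on the array, as above, avoid that.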
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Binary.h b/base/poco/MongoDB/include/Poco/MongoDB/Binary.h
index 1005cb000f5..aad8736e8b6 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Binary.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Binary.h
@@ -40,7 +40,7 @@ namespace MongoDB
/// A Binary stores its data in a Poco::Buffer.
{
public:
- typedef SharedPtr<Binary> Ptr;
+ using Ptr = SharedPtr<Binary>;
Binary();
/// Creates an empty Binary with subtype 0.
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Connection.h b/base/poco/MongoDB/include/Poco/MongoDB/Connection.h
index dcb813b75bc..cf679d530aa 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Connection.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Connection.h
@@ -18,6 +18,7 @@
#define MongoDB_Connection_INCLUDED
+#include "Poco/MongoDB/OpMsgMessage.h"
#include "Poco/MongoDB/RequestMessage.h"
#include "Poco/MongoDB/ResponseMessage.h"
#include "Poco/Mutex.h"
@@ -39,7 +40,7 @@ namespace MongoDB
/// for more information on the wire protocol.
{
public:
- typedef Poco::SharedPtr<Connection> Ptr;
+ using Ptr = Poco::SharedPtr<Connection>;
class MongoDB_API SocketFactory
{
@@ -90,7 +91,7 @@ namespace MongoDB
Poco::Net::SocketAddress address() const;
/// Returns the address of the MongoDB server.
-
+
const std::string & uri() const;
/// Returns the uri on which the connection was made.
@@ -145,6 +146,21 @@ namespace MongoDB
/// Use this when a response is expected: only a "query" or "getmore"
/// request will return a response.
+ void sendRequest(OpMsgMessage & request, OpMsgMessage & response);
+ /// Sends a request to the MongoDB server and receives the response
+ /// using the newer OP_MSG wire protocol.
+
+ void sendRequest(OpMsgMessage & request);
+ /// Sends an unacknowledged request to the MongoDB server using the newer
+ /// OP_MSG wire protocol.
+ /// No response is sent by the server.
+
+ void readResponse(OpMsgMessage & response);
+ /// Reads additional response data when the previous message's moreToCome flag
+ /// indicates that the server will send more data.
+ /// NOTE: See comments in OpMsgCursor code.
+
+
protected:
void connect();
@@ -164,7 +180,7 @@ namespace MongoDB
}
inline const std::string & Connection::uri() const
{
- return _uri;
+ return _uri;
}
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Cursor.h b/base/poco/MongoDB/include/Poco/MongoDB/Cursor.h
index 4aed9fe64fb..8849d737a62 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Cursor.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Cursor.h
@@ -40,6 +40,9 @@ namespace MongoDB
Cursor(const std::string & fullCollectionName, QueryRequest::Flags flags = QueryRequest::QUERY_DEFAULT);
/// Creates a Cursor for the given database and collection ("database.collection"), using the specified flags.
+ Cursor(const Document & aggregationResponse);
+ /// Creates a Cursor for the given aggregation query response.
+
virtual ~Cursor();
/// Destroys the Cursor.
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Database.h b/base/poco/MongoDB/include/Poco/MongoDB/Database.h
index 62aea632b08..3334a673df6 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Database.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Database.h
@@ -26,6 +26,8 @@
#include "Poco/MongoDB/QueryRequest.h"
#include "Poco/MongoDB/UpdateRequest.h"
+#include "Poco/MongoDB/OpMsgCursor.h"
+#include "Poco/MongoDB/OpMsgMessage.h"
namespace Poco
{
@@ -45,6 +47,9 @@ namespace MongoDB
virtual ~Database();
/// Destroys the Database.
+ const std::string & name() const;
+ /// Database name
+
bool authenticate(
Connection & connection,
const std::string & username,
@@ -62,34 +67,49 @@ namespace MongoDB
/// May throw a Poco::ProtocolException if authentication fails for a reason other than
/// invalid credentials.
+ Document::Ptr queryBuildInfo(Connection & connection) const;
+ /// Queries server build info (all wire protocols)
+
+ Document::Ptr queryServerHello(Connection & connection) const;
+ /// Queries hello response from server (all wire protocols)
+
Int64 count(Connection & connection, const std::string & collectionName) const;
- /// Sends a count request for the given collection to MongoDB.
+ /// Sends a count request for the given collection to MongoDB. (old wire protocol)
///
/// If the command fails, -1 is returned.
Poco::SharedPtr<QueryRequest> createCommand() const;
- /// Creates a QueryRequest for a command.
+ /// Creates a QueryRequest for a command. (old wire protocol)
Poco::SharedPtr<QueryRequest> createCountRequest(const std::string & collectionName) const;
/// Creates a QueryRequest to count the given collection.
- /// The collectionname must not contain the database name.
+ /// The collectionname must not contain the database name. (old wire protocol)
Poco::SharedPtr<DeleteRequest> createDeleteRequest(const std::string & collectionName) const;
/// Creates a DeleteRequest to delete documents in the given collection.
- /// The collectionname must not contain the database name.
+ /// The collectionname must not contain the database name. (old wire protocol)
Poco::SharedPtr<InsertRequest> createInsertRequest(const std::string & collectionName) const;
/// Creates an InsertRequest to insert new documents in the given collection.
- /// The collectionname must not contain the database name.
+ /// The collectionname must not contain the database name. (old wire protocol)
Poco::SharedPtr<QueryRequest> createQueryRequest(const std::string & collectionName) const;
- /// Creates a QueryRequest.
+ /// Creates a QueryRequest. (old wire protocol)
/// The collectionname must not contain the database name.
Poco::SharedPtr<UpdateRequest> createUpdateRequest(const std::string & collectionName) const;
- /// Creates an UpdateRequest.
+ /// Creates an UpdateRequest. (old wire protocol)
/// The collectionname must not contain the database name.
+ Poco::SharedPtr<OpMsgMessage> createOpMsgMessage(const std::string & collectionName) const;
+ /// Creates OpMsgMessage. (new wire protocol)
+
+ Poco::SharedPtr<OpMsgMessage> createOpMsgMessage() const;
+ /// Creates OpMsgMessage for database commands that do not require collection as an argument. (new wire protocol)
+
+ Poco::SharedPtr<OpMsgCursor> createOpMsgCursor(const std::string & collectionName) const;
+ /// Creates OpMsgCursor. (new wire protocol)
+
Poco::MongoDB::Document::Ptr ensureIndex(
Connection & connection,
const std::string & collection,
@@ -100,14 +120,16 @@ namespace MongoDB
int version = 0,
int ttl = 0);
/// Creates an index. The document returned is the result of a getLastError call.
- /// For more info look at the ensureIndex information on the MongoDB website.
+ /// For more info look at the ensureIndex information on the MongoDB website. (old wire protocol)
Document::Ptr getLastErrorDoc(Connection & connection) const;
/// Sends the getLastError command to the database and returns the error document.
+ /// (old wire protocol)
std::string getLastError(Connection & connection) const;
/// Sends the getLastError command to the database and returns the err element
/// from the error document. When err is null, an empty string is returned.
+ /// (old wire protocol)
static const std::string AUTH_MONGODB_CR;
/// Default authentication mechanism prior to MongoDB 3.0.
@@ -115,6 +137,27 @@ namespace MongoDB
static const std::string AUTH_SCRAM_SHA1;
/// Default authentication mechanism for MongoDB 3.0.
+ enum WireVersion
+ /// Wire version as reported by the command hello.
+ /// See details in MongoDB github, repository specifications.
+ /// @see queryServerHello
+ {
+ VER_26 = 1,
+ VER_26_2 = 2,
+ VER_30 = 3,
+ VER_32 = 4,
+ VER_34 = 5,
+ VER_36 = 6, ///< First wire version that supports OP_MSG
+ VER_40 = 7,
+ VER_42 = 8,
+ VER_44 = 9,
+ VER_50 = 13,
+ VER_51 = 14, ///< First wire version that supports only OP_MSG
+ VER_52 = 15,
+ VER_53 = 16,
+ VER_60 = 17
+ };
+
protected:
bool authCR(Connection & connection, const std::string & username, const std::string & password);
bool authSCRAM(Connection & connection, const std::string & username, const std::string & password);
@@ -127,6 +170,12 @@ namespace MongoDB
//
// inlines
//
+ inline const std::string & Database::name() const
+ {
+ return _dbname;
+ }
+
+
inline Poco::SharedPtr<QueryRequest> Database::createCommand() const
{
Poco::SharedPtr<QueryRequest> cmd = createQueryRequest("$cmd");
@@ -158,6 +207,24 @@ namespace MongoDB
return new Poco::MongoDB::UpdateRequest(_dbname + '.' + collectionName);
}
+ // -- New wire protocol commands
+
+ inline Poco::SharedPtr<OpMsgMessage> Database::createOpMsgMessage(const std::string & collectionName) const
+ {
+ return new Poco::MongoDB::OpMsgMessage(_dbname, collectionName);
+ }
+
+ inline Poco::SharedPtr<OpMsgMessage> Database::createOpMsgMessage() const
+ {
+ // Collection name for database commands is not needed.
+ return createOpMsgMessage("");
+ }
+
+ inline Poco::SharedPtr<OpMsgCursor> Database::createOpMsgCursor(const std::string & collectionName) const
+ {
+ return new Poco::MongoDB::OpMsgCursor(_dbname, collectionName);
+ }
+
}
} // namespace Poco::MongoDB
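Putting the new Database helpers together: query the server's hello document, check the reported wire version, and only then build OP_MSG requests. A hedged sketch (not part of the patch; it assumes a MongoDB server on localhost:27017, a database "test", a collection "people", and that the hello response carries the standard maxWireVersion field):

#include <iostream>
#include "Poco/MongoDB/Connection.h"
#include "Poco/MongoDB/Database.h"

int main()
{
    Poco::MongoDB::Connection connection("localhost", 27017);
    Poco::MongoDB::Database db("test");

    Poco::MongoDB::Document::Ptr hello = db.queryServerHello(connection);
    if (hello->getInteger("maxWireVersion") >= Poco::MongoDB::Database::VER_36)
    {
        // The server speaks OP_MSG: insert one document over the new wire protocol.
        auto insert = db.createOpMsgMessage("people");
        insert->setCommandName(Poco::MongoDB::OpMsgMessage::CMD_INSERT);
        Poco::MongoDB::Document::Ptr doc = new Poco::MongoDB::Document();
        doc->add("name", std::string("Ada"));
        insert->documents().push_back(doc);

        Poco::MongoDB::OpMsgMessage response;
        connection.sendRequest(*insert, response);
        std::cout << (response.responseOk() ? "inserted" : "failed") << '\n';
    }
    return 0;
}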
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Document.h b/base/poco/MongoDB/include/Poco/MongoDB/Document.h
index 12889663827..9e1df349e20 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Document.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Document.h
@@ -31,6 +31,7 @@ namespace Poco
namespace MongoDB
{
+ class Array;
class ElementFindByName
{
@@ -48,8 +49,8 @@ namespace MongoDB
/// Represents a MongoDB (BSON) document.
{
public:
- typedef SharedPtr<Document> Ptr;
- typedef std::vector<Document::Ptr> Vector;
+ using Ptr = SharedPtr<Document>;
+ using Vector = std::vector<Document::Ptr>;
Document();
/// Creates an empty Document.
@@ -86,6 +87,10 @@ namespace MongoDB
/// Unlike the other add methods, this method returns
/// a reference to the new document.
+ Array & addNewArray(const std::string & name);
+ /// Create a new array and add it to this document.
+ /// Method returns a reference to the new array.
+
void clear();
/// Removes all elements from the document.
@@ -95,7 +100,7 @@ namespace MongoDB
bool empty() const;
/// Returns true if the document doesn't contain any elements.
- bool exists(const std::string & name);
+ bool exists(const std::string & name) const;
/// Returns true if the document has an element with the given name.
template <typename T>
@@ -158,6 +163,9 @@ namespace MongoDB
/// return an Int64. When the element is not found, a
/// Poco::NotFoundException will be thrown.
+ bool remove(const std::string & name);
+ /// Removes an element from the document.
+
template <typename T>
bool isType(const std::string & name) const
/// Returns true when the type of the element equals the TypeId of ElementTrait.
@@ -227,12 +235,23 @@ namespace MongoDB
}
- inline bool Document::exists(const std::string & name)
+ inline bool Document::exists(const std::string & name) const
{
return std::find_if(_elements.begin(), _elements.end(), ElementFindByName(name)) != _elements.end();
}
+ inline bool Document::remove(const std::string & name)
+ {
+ auto it = std::find_if(_elements.begin(), _elements.end(), ElementFindByName(name));
+ if (it == _elements.end())
+ return false;
+
+ _elements.erase(it);
+ return true;
+ }
+
+
inline std::size_t Document::size() const
{
return _elements.size();
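Document gains addNewArray(), a const-qualified exists(), and remove(). A short sketch of the new surface (not part of the patch; "sensor-1" and the field names are illustrative):

#include <iostream>
#include "Poco/MongoDB/Array.h"
#include "Poco/MongoDB/Document.h"

int main()
{
    Poco::MongoDB::Document doc;
    doc.add("name", std::string("sensor-1"));

    // addNewArray() attaches a fresh array and hands back a reference to it.
    Poco::MongoDB::Array & readings = doc.addNewArray("readings");
    readings.add(1.5);
    readings.add(2.5);

    std::cout << doc.exists("name") << '\n';  // 1; exists() is now callable on const documents
    doc.remove("name");                       // returns true when the element was found
    std::cout << doc.exists("name") << '\n';  // 0
    return 0;
}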
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/Element.h b/base/poco/MongoDB/include/Poco/MongoDB/Element.h
index b5592bd0e0b..26525d7d02b 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/Element.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/Element.h
@@ -45,7 +45,7 @@ namespace MongoDB
/// Represents an Element of a Document or an Array.
{
public:
- typedef Poco::SharedPtr<Element> Ptr;
+ using Ptr = Poco::SharedPtr<Element>;
explicit Element(const std::string & name);
/// Creates the Element with the given name.
@@ -80,7 +80,7 @@ namespace MongoDB
}
- typedef std::list<Element::Ptr> ElementSet;
+ using ElementSet = std::list<Element::Ptr>;
template <typename T>
@@ -266,7 +266,7 @@ namespace MongoDB
}
- typedef Nullable<unsigned char> NullValue;
+ using NullValue = Nullable<unsigned char>;
// BSON Null Value
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/JavaScriptCode.h b/base/poco/MongoDB/include/Poco/MongoDB/JavaScriptCode.h
index df1edc16817..c0f584b7c19 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/JavaScriptCode.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/JavaScriptCode.h
@@ -35,7 +35,7 @@ namespace MongoDB
/// Represents JavaScript type in BSON.
{
public:
- typedef SharedPtr<JavaScriptCode> Ptr;
+ using Ptr = SharedPtr<JavaScriptCode>;
JavaScriptCode();
/// Creates an empty JavaScriptCode object.
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/MessageHeader.h b/base/poco/MongoDB/include/Poco/MongoDB/MessageHeader.h
index 2b88e30fc74..98f45e876c1 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/MessageHeader.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/MessageHeader.h
@@ -28,6 +28,9 @@ namespace MongoDB
{
+ class Message; // Required to disambiguate friend declaration in MessageHeader.
+
+
class MongoDB_API MessageHeader
/// Represents the message header which is always prepended to a
/// MongoDB request or response message.
@@ -37,14 +40,18 @@ namespace MongoDB
enum OpCode
{
+ // Opcodes deprecated in MongoDB 5.0
OP_REPLY = 1,
- OP_MSG = 1000,
OP_UPDATE = 2001,
OP_INSERT = 2002,
OP_QUERY = 2004,
OP_GET_MORE = 2005,
OP_DELETE = 2006,
- OP_KILL_CURSORS = 2007
+ OP_KILL_CURSORS = 2007,
+
+ /// Opcodes supported in MongoDB 5.1 and later
+ OP_COMPRESSED = 2012,
+ OP_MSG = 2013
};
explicit MessageHeader(OpCode);
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/MongoDB.h b/base/poco/MongoDB/include/Poco/MongoDB/MongoDB.h
index 253f1f8ab27..de246ddc9dd 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/MongoDB.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/MongoDB.h
@@ -33,6 +33,13 @@
//
+#if defined(_WIN32) && defined(POCO_DLL)
+# if defined(MongoDB_EXPORTS)
+# define MongoDB_API __declspec(dllexport)
+# else
+# define MongoDB_API __declspec(dllimport)
+# endif
+#endif
#if !defined(MongoDB_API)
@@ -47,6 +54,11 @@
//
// Automatically link MongoDB library.
//
+#if defined(_MSC_VER)
+# if !defined(POCO_NO_AUTOMATIC_LIBS) && !defined(MongoDB_EXPORTS)
+# pragma comment(lib, "PocoMongoDB" POCO_LIB_SUFFIX)
+# endif
+#endif
#endif // MongoDBMongoDB_INCLUDED
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/ObjectId.h b/base/poco/MongoDB/include/Poco/MongoDB/ObjectId.h
index 76bb190db48..8a335320ea0 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/ObjectId.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/ObjectId.h
@@ -44,7 +44,7 @@ namespace MongoDB
/// as its value.
{
public:
- typedef SharedPtr<ObjectId> Ptr;
+ using Ptr = SharedPtr<ObjectId>;
explicit ObjectId(const std::string & id);
/// Creates an ObjectId from a string.
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/OpMsgCursor.h b/base/poco/MongoDB/include/Poco/MongoDB/OpMsgCursor.h
new file mode 100644
index 00000000000..a465a71bb1c
--- /dev/null
+++ b/base/poco/MongoDB/include/Poco/MongoDB/OpMsgCursor.h
@@ -0,0 +1,96 @@
+//
+// OpMsgCursor.h
+//
+// Library: MongoDB
+// Package: MongoDB
+// Module: OpMsgCursor
+//
+// Definition of the OpMsgCursor class.
+//
+// Copyright (c) 2012, Applied Informatics Software Engineering GmbH.
+// and Contributors.
+//
+// SPDX-License-Identifier: BSL-1.0
+//
+
+
+#ifndef MongoDB_OpMsgCursor_INCLUDED
+#define MongoDB_OpMsgCursor_INCLUDED
+
+
+#include "Poco/MongoDB/Connection.h"
+#include "Poco/MongoDB/MongoDB.h"
+#include "Poco/MongoDB/OpMsgMessage.h"
+
+namespace Poco
+{
+namespace MongoDB
+{
+
+
+ class MongoDB_API OpMsgCursor : public Document
+ /// OpMsgCursor is a helper class for querying multiple documents using OpMsgMessage.
+ {
+ public:
+ OpMsgCursor(const std::string & dbname, const std::string & collectionName);
+ /// Creates an OpMsgCursor for the given database and collection.
+
+ virtual ~OpMsgCursor();
+ /// Destroys the OpMsgCursor.
+
+ void setEmptyFirstBatch(bool empty);
+ /// An empty first batch is used to get an error response faster with little server processing
+
+ bool emptyFirstBatch() const;
+
+ void setBatchSize(Int32 batchSize);
+ /// Set non-default batch size
+
+ Int32 batchSize() const;
+ /// Current batch size (zero or negative number indicates default batch size)
+
+ Int64 cursorID() const;
+
+ OpMsgMessage & next(Connection & connection);
+ /// Tries to get the next documents. As long as response message has a
+ /// cursor ID next can be called to retrieve the next bunch of documents.
+ ///
+ /// The cursor must be killed (see kill()) when not all documents are needed.
+
+ OpMsgMessage & query();
+ /// Returns the associated query.
+
+ void kill(Connection & connection);
+ /// Kills the cursor and resets it so that it can be reused.
+
+ private:
+ OpMsgMessage _query;
+ OpMsgMessage _response;
+
+ bool _emptyFirstBatch{false};
+ Int32 _batchSize{-1};
+ /// Batch size used in the cursor. Zero or negative value means that default shall be used.
+
+ Int64 _cursorID{0};
+ };
+
+
+ //
+ // inlines
+ //
+ inline OpMsgMessage & OpMsgCursor::query()
+ {
+ return _query;
+ }
+
+ inline Int64 OpMsgCursor::cursorID() const
+ {
+ return _cursorID;
+ }
+
+
+}
+} // namespace Poco::MongoDB
+
+
+#endif // MongoDB_OpMsgCursor_INCLUDED
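Typical OpMsgCursor flow: configure the find command on query(), then call next() until the server reports cursor ID 0. A hedged sketch (not part of the patch; assumes a reachable server and the example database/collection names used above):

#include <iostream>
#include "Poco/MongoDB/Connection.h"
#include "Poco/MongoDB/OpMsgCursor.h"

int main()
{
    Poco::MongoDB::Connection connection("localhost", 27017);

    Poco::MongoDB::OpMsgCursor cursor("test", "people");
    cursor.query().setCommandName(Poco::MongoDB::OpMsgMessage::CMD_FIND);
    cursor.setBatchSize(100);

    while (true)
    {
        Poco::MongoDB::OpMsgMessage & response = cursor.next(connection);
        for (const auto & doc : response.documents())
            std::cout << doc->toString() << '\n';
        if (cursor.cursorID() == 0)
            break;  // server exhausted the cursor
    }
    // kill() matters only when abandoning a live cursor early; it is a
    // no-op once the cursor ID has reached zero.
    cursor.kill(connection);
    return 0;
}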
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/OpMsgMessage.h b/base/poco/MongoDB/include/Poco/MongoDB/OpMsgMessage.h
new file mode 100644
index 00000000000..699c7fc4e12
--- /dev/null
+++ b/base/poco/MongoDB/include/Poco/MongoDB/OpMsgMessage.h
@@ -0,0 +1,163 @@
+//
+// OpMsgMessage.h
+//
+// Library: MongoDB
+// Package: MongoDB
+// Module: OpMsgMessage
+//
+// Definition of the OpMsgMessage class.
+//
+// Copyright (c) 2022, Applied Informatics Software Engineering GmbH.
+// and Contributors.
+//
+// SPDX-License-Identifier: BSL-1.0
+//
+
+
+#ifndef MongoDB_OpMsgMessage_INCLUDED
+#define MongoDB_OpMsgMessage_INCLUDED
+
+
+#include "Poco/MongoDB/Document.h"
+#include "Poco/MongoDB/Message.h"
+#include "Poco/MongoDB/MongoDB.h"
+
+#include <string>
+
+namespace Poco
+{
+namespace MongoDB
+{
+
+
+ class MongoDB_API OpMsgMessage : public Message
+ /// This class represents a request/response message (OP_MSG) used to send requests to and receive responses from MongoDB.
+ {
+ public:
+ // Constants for most often used MongoDB commands that can be sent using OP_MSG
+ // For complete list see: https://www.mongodb.com/docs/manual/reference/command/
+
+ // Query and write
+ static const std::string CMD_INSERT;
+ static const std::string CMD_DELETE;
+ static const std::string CMD_UPDATE;
+ static const std::string CMD_FIND;
+ static const std::string CMD_FIND_AND_MODIFY;
+ static const std::string CMD_GET_MORE;
+
+ // Aggregation
+ static const std::string CMD_AGGREGATE;
+ static const std::string CMD_COUNT;
+ static const std::string CMD_DISTINCT;
+ static const std::string CMD_MAP_REDUCE;
+
+ // Replication and administration
+ static const std::string CMD_HELLO;
+ static const std::string CMD_REPL_SET_GET_STATUS;
+ static const std::string CMD_REPL_SET_GET_CONFIG;
+
+ static const std::string CMD_CREATE;
+ static const std::string CMD_CREATE_INDEXES;
+ static const std::string CMD_DROP;
+ static const std::string CMD_DROP_DATABASE;
+ static const std::string CMD_KILL_CURSORS;
+ static const std::string CMD_LIST_DATABASES;
+ static const std::string CMD_LIST_INDEXES;
+
+ // Diagnostic
+ static const std::string CMD_BUILD_INFO;
+ static const std::string CMD_COLL_STATS;
+ static const std::string CMD_DB_STATS;
+ static const std::string CMD_HOST_INFO;
+
+
+ enum Flags : UInt32
+ {
+ MSG_FLAGS_DEFAULT = 0,
+
+ MSG_CHECKSUM_PRESENT = (1 << 0),
+
+ MSG_MORE_TO_COME = (1 << 1),
+ /// Sender will send another message and is not prepared for overlapping messages
+
+ MSG_EXHAUST_ALLOWED = (1 << 16)
+ /// Client is prepared for multiple replies (using the moreToCome bit) to this request
+ };
+
+ OpMsgMessage();
+ /// Creates an OpMsgMessage for response.
+
+ OpMsgMessage(const std::string & databaseName, const std::string & collectionName, UInt32 flags = MSG_FLAGS_DEFAULT);
+ /// Creates an OpMsgMessage for requests.
+
+ virtual ~OpMsgMessage();
+
+ const std::string & databaseName() const;
+
+ const std::string & collectionName() const;
+
+ void setCommandName(const std::string & command);
+ /// Sets the command name and clears the command document
+
+ void setCursor(Poco::Int64 cursorID, Poco::Int32 batchSize = -1);
+ /// Sets the command "getMore" for the cursor id with batch size (if it is not negative).
+
+ const std::string & commandName() const;
+ /// Current command name.
+
+ void setAcknowledgedRequest(bool ack);
+ /// Set to false to create a request that does not return a response.
+ /// It has an effect only for commands that write or delete documents.
+ /// Default is true (the request returns an acknowledged response).
+
+ bool acknowledgedRequest() const;
+
+ UInt32 flags() const;
+
+ Document & body();
+ /// Access to body document.
+ /// Additional query arguments shall be added after setting the command name.
+
+ const Document & body() const;
+
+ Document::Vector & documents();
+ /// Documents prepared for request or retrieved in response.
+
+ const Document::Vector & documents() const;
+ /// Documents prepared for request or retrieved in response.
+
+ bool responseOk() const;
+ /// Reads "ok" status from the response message.
+
+ void clear();
+ /// Clears the message.
+
+ void send(std::ostream & ostr);
+ /// Writes the request to stream.
+
+ void read(std::istream & istr);
+ /// Reads the response from the stream.
+
+ private:
+ enum PayloadType : UInt8
+ {
+ PAYLOAD_TYPE_0 = 0,
+ PAYLOAD_TYPE_1 = 1
+ };
+
+ std::string _databaseName;
+ std::string _collectionName;
+ UInt32 _flags{MSG_FLAGS_DEFAULT};
+ std::string _commandName;
+ bool _acknowledged{true};
+
+ Document _body;
+ Document::Vector _documents;
+ };
+
+
+}
+} // namespace Poco::MongoDB
+
+
+#endif // MongoDB_OpMsgMessage_INCLUDED
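A request is assembled by naming the command first (setCommandName() inserts it as the leading BSON element) and then adding arguments to body(). A hedged sketch of a filtered find (not part of the patch; assumes a reachable server and illustrative names):

#include <iostream>
#include "Poco/MongoDB/Connection.h"
#include "Poco/MongoDB/OpMsgMessage.h"

int main()
{
    Poco::MongoDB::Connection connection("localhost", 27017);

    Poco::MongoDB::OpMsgMessage request("test", "people");
    request.setCommandName(Poco::MongoDB::OpMsgMessage::CMD_FIND);
    request.body().addNewDocument("filter").add("age", Poco::Int32(30));

    Poco::MongoDB::OpMsgMessage response;
    connection.sendRequest(request, response);
    if (response.responseOk())
        for (const auto & doc : response.documents())
            std::cout << doc->toString(2) << '\n';
    return 0;
}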
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/PoolableConnectionFactory.h b/base/poco/MongoDB/include/Poco/MongoDB/PoolableConnectionFactory.h
index 9d35c728e5e..53f4a5127ef 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/PoolableConnectionFactory.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/PoolableConnectionFactory.h
@@ -94,7 +94,23 @@ namespace MongoDB
operator Connection::Ptr() { return _connection; }
+#if defined(POCO_ENABLE_CPP11)
+ // Disable copy to prevent unwanted release of resources: C++11 way
+ PooledConnection(const PooledConnection &) = delete;
+ PooledConnection & operator=(const PooledConnection &) = delete;
+
+ // Enable move semantics
+ PooledConnection(PooledConnection && other) = default;
+ PooledConnection & operator=(PooledConnection &&) = default;
+#endif
+
private:
+#if !defined(POCO_ENABLE_CPP11)
+ // Disable copy to prevent unwanted release of resources: pre C++11 way
+ PooledConnection(const PooledConnection &);
+ PooledConnection & operator=(const PooledConnection &);
+#endif
+
Poco::ObjectPool & _pool;
Connection::Ptr _connection;
};
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/RegularExpression.h b/base/poco/MongoDB/include/Poco/MongoDB/RegularExpression.h
index b9a8694d321..244b8c14163 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/RegularExpression.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/RegularExpression.h
@@ -33,7 +33,7 @@ namespace MongoDB
/// Represents a regular expression in BSON format.
{
public:
- typedef SharedPtr<RegularExpression> Ptr;
+ using Ptr = SharedPtr<RegularExpression>;
RegularExpression();
/// Creates an empty RegularExpression.
diff --git a/base/poco/MongoDB/include/Poco/MongoDB/ResponseMessage.h b/base/poco/MongoDB/include/Poco/MongoDB/ResponseMessage.h
index 132859cc75f..9cb92cb16c4 100644
--- a/base/poco/MongoDB/include/Poco/MongoDB/ResponseMessage.h
+++ b/base/poco/MongoDB/include/Poco/MongoDB/ResponseMessage.h
@@ -38,6 +38,9 @@ namespace MongoDB
ResponseMessage();
/// Creates an empty ResponseMessage.
+ ResponseMessage(const Int64 & cursorID);
+ /// Creates a ResponseMessage for an existing cursor ID.
+
virtual ~ResponseMessage();
/// Destroys the ResponseMessage.
diff --git a/base/poco/MongoDB/src/Array.cpp b/base/poco/MongoDB/src/Array.cpp
index c6d96d1371d..6fff0994d82 100644
--- a/base/poco/MongoDB/src/Array.cpp
+++ b/base/poco/MongoDB/src/Array.cpp
@@ -20,7 +20,7 @@ namespace Poco {
namespace MongoDB {
-Array::Array():
+Array::Array():
Document()
{
}
@@ -31,7 +31,7 @@ Array::~Array()
}
-Element::Ptr Array::get(int pos) const
+Element::Ptr Array::get(std::size_t pos) const
{
std::string name = Poco::NumberFormatter::format(pos);
return Document::get(name);
diff --git a/base/poco/MongoDB/src/Connection.cpp b/base/poco/MongoDB/src/Connection.cpp
index 38c31d2250a..fa20887054b 100644
--- a/base/poco/MongoDB/src/Connection.cpp
+++ b/base/poco/MongoDB/src/Connection.cpp
@@ -319,4 +319,30 @@ void Connection::sendRequest(RequestMessage& request, ResponseMessage& response)
}
+void Connection::sendRequest(OpMsgMessage& request, OpMsgMessage& response)
+{
+ Poco::Net::SocketOutputStream sos(_socket);
+ request.send(sos);
+
+ response.clear();
+ readResponse(response);
+}
+
+
+void Connection::sendRequest(OpMsgMessage& request)
+{
+ request.setAcknowledgedRequest(false);
+ Poco::Net::SocketOutputStream sos(_socket);
+ request.send(sos);
+}
+
+
+void Connection::readResponse(OpMsgMessage& response)
+{
+ Poco::Net::SocketInputStream sis(_socket);
+ response.read(sis);
+}
+
+
+
} } // Poco::MongoDB
diff --git a/base/poco/MongoDB/src/Cursor.cpp b/base/poco/MongoDB/src/Cursor.cpp
index 69031e0ab65..ef7a4ca961d 100644
--- a/base/poco/MongoDB/src/Cursor.cpp
+++ b/base/poco/MongoDB/src/Cursor.cpp
@@ -33,6 +33,12 @@ Cursor::Cursor(const std::string& fullCollectionName, QueryRequest::Flags flags)
}
+Cursor::Cursor(const Document& aggregationResponse) :
+ _query(aggregationResponse.get<Poco::MongoDB::Document::Ptr>("cursor")->get<std::string>("ns")),
+ _response(aggregationResponse.get<Poco::MongoDB::Document::Ptr>("cursor")->get<Int64>("id"))
+{
+}
+
Cursor::~Cursor()
{
try
diff --git a/base/poco/MongoDB/src/Database.cpp b/base/poco/MongoDB/src/Database.cpp
index 2b31523bdc4..1a0d3cfe559 100644
--- a/base/poco/MongoDB/src/Database.cpp
+++ b/base/poco/MongoDB/src/Database.cpp
@@ -334,6 +334,50 @@ bool Database::authSCRAM(Connection& connection, const std::string& username, co
}
+Document::Ptr Database::queryBuildInfo(Connection& connection) const
+{
+ // build info can be issued on "config" system database
+ Poco::SharedPtr<Poco::MongoDB::QueryRequest> request = createCommand();
+ request->selector().add("buildInfo", 1);
+
+ Poco::MongoDB::ResponseMessage response;
+ connection.sendRequest(*request, response);
+
+ Document::Ptr buildInfo;
+ if ( response.documents().size() > 0 )
+ {
+ buildInfo = response.documents()[0];
+ }
+ else
+ {
+ throw Poco::ProtocolException("Didn't get a response from the buildinfo command");
+ }
+ return buildInfo;
+}
+
+
+Document::Ptr Database::queryServerHello(Connection& connection) const
+{
+ // hello can be issued on "config" system database
+ Poco::SharedPtr<Poco::MongoDB::QueryRequest> request = createCommand();
+ request->selector().add("hello", 1);
+
+ Poco::MongoDB::ResponseMessage response;
+ connection.sendRequest(*request, response);
+
+ Document::Ptr hello;
+ if ( response.documents().size() > 0 )
+ {
+ hello = response.documents()[0];
+ }
+ else
+ {
+ throw Poco::ProtocolException("Didn't get a response from the hello command");
+ }
+ return hello;
+}
+
+
Int64 Database::count(Connection& connection, const std::string& collectionName) const
{
Poco::SharedPtr<QueryRequest> countRequest = createCountRequest(collectionName);
@@ -390,7 +434,7 @@ Document::Ptr Database::getLastErrorDoc(Connection& connection) const
{
Document::Ptr errorDoc;
- Poco::SharedPtr<QueryRequest> request = createQueryRequest("$cmd");
+ Poco::SharedPtr<QueryRequest> request = createCommand();
request->setNumberToReturn(1);
request->selector().add("getLastError", 1);
@@ -420,7 +464,7 @@ std::string Database::getLastError(Connection& connection) const
Poco::SharedPtr Database::createCountRequest(const std::string& collectionName) const
{
- Poco::SharedPtr<QueryRequest> request = createQueryRequest("$cmd");
+ Poco::SharedPtr<QueryRequest> request = createCommand();
request->setNumberToReturn(1);
request->selector().add("count", collectionName);
return request;
diff --git a/base/poco/MongoDB/src/DeleteRequest.cpp b/base/poco/MongoDB/src/DeleteRequest.cpp
index 67a88c33302..ba75beb55fb 100644
--- a/base/poco/MongoDB/src/DeleteRequest.cpp
+++ b/base/poco/MongoDB/src/DeleteRequest.cpp
@@ -20,8 +20,8 @@ namespace MongoDB {
DeleteRequest::DeleteRequest(const std::string& collectionName, DeleteRequest::Flags flags):
- RequestMessage(MessageHeader::OP_DELETE),
- _flags(flags),
+ RequestMessage(MessageHeader::OP_DELETE),
+ _flags(flags),
_fullCollectionName(collectionName),
_selector()
{
diff --git a/base/poco/MongoDB/src/Document.cpp b/base/poco/MongoDB/src/Document.cpp
index 114fc993891..f7c5c9c5dc6 100644
--- a/base/poco/MongoDB/src/Document.cpp
+++ b/base/poco/MongoDB/src/Document.cpp
@@ -35,6 +35,14 @@ Document::~Document()
}
+Array& Document::addNewArray(const std::string& name)
+{
+ Array::Ptr newArray = new Array();
+ add(name, newArray);
+ return *newArray;
+}
+
+
Element::Ptr Document::get(const std::string& name) const
{
Element::Ptr element;
@@ -84,7 +92,7 @@ void Document::read(BinaryReader& reader)
while (type != '\0')
{
Element::Ptr element;
-
+
std::string name = BSONReader(reader).readCString();
switch (type)
@@ -198,7 +206,7 @@ void Document::write(BinaryWriter& writer)
else
{
std::stringstream sstream;
- Poco::BinaryWriter tempWriter(sstream);
+ Poco::BinaryWriter tempWriter(sstream, BinaryWriter::LITTLE_ENDIAN_BYTE_ORDER);
for (ElementSet::iterator it = _elements.begin(); it != _elements.end(); ++it)
{
tempWriter << static_cast<unsigned char>((*it)->type());
@@ -207,7 +215,7 @@ void Document::write(BinaryWriter& writer)
element->write(tempWriter);
}
tempWriter.flush();
-
+
Poco::Int32 len = static_cast<Poco::Int32>(5 + sstream.tellp()); /* 5 = sizeof(len) + 0-byte */
writer << len;
writer.writeRaw(sstream.str());
diff --git a/base/poco/MongoDB/src/Element.cpp b/base/poco/MongoDB/src/Element.cpp
index 89629e0503e..f91ce264493 100644
--- a/base/poco/MongoDB/src/Element.cpp
+++ b/base/poco/MongoDB/src/Element.cpp
@@ -24,7 +24,7 @@ Element::Element(const std::string& name) : _name(name)
}
-Element::~Element()
+Element::~Element()
{
}
diff --git a/base/poco/MongoDB/src/GetMoreRequest.cpp b/base/poco/MongoDB/src/GetMoreRequest.cpp
index f8a6b73c6ad..2c1f6909eb7 100644
--- a/base/poco/MongoDB/src/GetMoreRequest.cpp
+++ b/base/poco/MongoDB/src/GetMoreRequest.cpp
@@ -21,7 +21,7 @@ namespace MongoDB {
GetMoreRequest::GetMoreRequest(const std::string& collectionName, Int64 cursorID):
- RequestMessage(MessageHeader::OP_GET_MORE),
+ RequestMessage(MessageHeader::OP_GET_MORE),
_fullCollectionName(collectionName),
_numberToReturn(100),
_cursorID(cursorID)
diff --git a/base/poco/MongoDB/src/InsertRequest.cpp b/base/poco/MongoDB/src/InsertRequest.cpp
index ec8dc9cf94a..65be5654b3e 100644
--- a/base/poco/MongoDB/src/InsertRequest.cpp
+++ b/base/poco/MongoDB/src/InsertRequest.cpp
@@ -20,7 +20,7 @@ namespace MongoDB {
InsertRequest::InsertRequest(const std::string& collectionName, Flags flags):
- RequestMessage(MessageHeader::OP_INSERT),
+ RequestMessage(MessageHeader::OP_INSERT),
_flags(flags),
_fullCollectionName(collectionName)
{
diff --git a/base/poco/MongoDB/src/KillCursorsRequest.cpp b/base/poco/MongoDB/src/KillCursorsRequest.cpp
index 6baa0e0be8f..448002aa16a 100644
--- a/base/poco/MongoDB/src/KillCursorsRequest.cpp
+++ b/base/poco/MongoDB/src/KillCursorsRequest.cpp
@@ -37,7 +37,7 @@ void KillCursorsRequest::buildRequest(BinaryWriter& writer)
for (std::vector<Int64>::iterator it = _cursors.begin(); it != _cursors.end(); ++it)
{
writer << *it;
- }
+ }
}
diff --git a/base/poco/MongoDB/src/Message.cpp b/base/poco/MongoDB/src/Message.cpp
index c29d282d15a..7b1cb23bab6 100644
--- a/base/poco/MongoDB/src/Message.cpp
+++ b/base/poco/MongoDB/src/Message.cpp
@@ -19,7 +19,7 @@ namespace Poco {
namespace MongoDB {
-Message::Message(MessageHeader::OpCode opcode):
+Message::Message(MessageHeader::OpCode opcode):
_header(opcode)
{
}
diff --git a/base/poco/MongoDB/src/MessageHeader.cpp b/base/poco/MongoDB/src/MessageHeader.cpp
index 222121243db..b472bcec465 100644
--- a/base/poco/MongoDB/src/MessageHeader.cpp
+++ b/base/poco/MongoDB/src/MessageHeader.cpp
@@ -20,10 +20,10 @@ namespace Poco {
namespace MongoDB {
-MessageHeader::MessageHeader(OpCode opCode):
- _messageLength(0),
- _requestID(0),
- _responseTo(0),
+MessageHeader::MessageHeader(OpCode opCode):
+ _messageLength(0),
+ _requestID(0),
+ _responseTo(0),
_opCode(opCode)
{
}
@@ -42,7 +42,7 @@ void MessageHeader::read(BinaryReader& reader)
Int32 opCode;
reader >> opCode;
- _opCode = (OpCode) opCode;
+ _opCode = static_cast<OpCode>(opCode);
if (!reader.good())
{
@@ -56,7 +56,7 @@ void MessageHeader::write(BinaryWriter& writer)
writer << _messageLength;
writer << _requestID;
writer << _responseTo;
- writer << (Int32) _opCode;
+ writer << static_cast<Int32>(_opCode);
}
diff --git a/base/poco/MongoDB/src/ObjectId.cpp b/base/poco/MongoDB/src/ObjectId.cpp
index 3065a2ffc30..0125c246c2d 100644
--- a/base/poco/MongoDB/src/ObjectId.cpp
+++ b/base/poco/MongoDB/src/ObjectId.cpp
@@ -32,7 +32,7 @@ ObjectId::ObjectId(const std::string& id)
poco_assert_dbg(id.size() == 24);
const char* p = id.c_str();
- for (std::size_t i = 0; i < 12; ++i)
+ for (std::size_t i = 0; i < 12; ++i)
{
_id[i] = fromHex(p);
p += 2;
diff --git a/base/poco/MongoDB/src/OpMsgCursor.cpp b/base/poco/MongoDB/src/OpMsgCursor.cpp
new file mode 100644
index 00000000000..bc95851ae33
--- /dev/null
+++ b/base/poco/MongoDB/src/OpMsgCursor.cpp
@@ -0,0 +1,187 @@
+//
+// OpMsgCursor.cpp
+//
+// Library: MongoDB
+// Package: MongoDB
+// Module: OpMsgCursor
+//
+// Copyright (c) 2022, Applied Informatics Software Engineering GmbH.
+// and Contributors.
+//
+// SPDX-License-Identifier: BSL-1.0
+//
+
+
+#include "Poco/MongoDB/OpMsgCursor.h"
+#include "Poco/MongoDB/Array.h"
+
+//
+// NOTE:
+//
+// MongoDB specification indicates that the flag MSG_EXHAUST_ALLOWED shall be
+// used in the request when the receiver is ready to receive multiple messages
+// without sending additional requests in between. Sender (MongoDB) indicates
+// that more messages follow with flag MSG_MORE_TO_COME.
+//
+// It seems that this does not work properly. MSG_MORE_TO_COME is set and reading
+// next messages sometimes works, however often the data is missing in response
+// or the message header contains wrong message length and reading blocks.
+// Opcode in the header is correct.
+//
+// Using MSG_EXHAUST_ALLOWED is therefore currently disabled.
+//
+// It seems that related JIRA ticket is:
+//
+// https://jira.mongodb.org/browse/SERVER-57297
+//
+// https://github.com/mongodb/specifications/blob/master/source/message/OP_MSG.rst
+//
+
+#define MONGODB_EXHAUST_ALLOWED_WORKS false
+
+namespace Poco {
+namespace MongoDB {
+
+
+static const std::string keyCursor {"cursor"};
+static const std::string keyFirstBatch {"firstBatch"};
+static const std::string keyNextBatch {"nextBatch"};
+
+static Poco::Int64 cursorIdFromResponse(const MongoDB::Document& doc);
+
+
+OpMsgCursor::OpMsgCursor(const std::string& db, const std::string& collection):
+#if MONGODB_EXHAUST_ALLOWED_WORKS
+ _query(db, collection, OpMsgMessage::MSG_EXHAUST_ALLOWED)
+#else
+ _query(db, collection)
+#endif
+{
+}
+
+OpMsgCursor::~OpMsgCursor()
+{
+ try
+ {
+ poco_assert_dbg(_cursorID == 0);
+ }
+ catch (...)
+ {
+ }
+}
+
+
+void OpMsgCursor::setEmptyFirstBatch(bool empty)
+{
+ _emptyFirstBatch = empty;
+}
+
+
+bool OpMsgCursor::emptyFirstBatch() const
+{
+ return _emptyFirstBatch;
+}
+
+
+void OpMsgCursor::setBatchSize(Int32 batchSize)
+{
+ _batchSize = batchSize;
+}
+
+
+Int32 OpMsgCursor::batchSize() const
+{
+ return _batchSize;
+}
+
+
+OpMsgMessage& OpMsgCursor::next(Connection& connection)
+{
+ if (_cursorID == 0)
+ {
+ _response.clear();
+
+ if (_emptyFirstBatch || _batchSize > 0)
+ {
+ Int32 bsize = _emptyFirstBatch ? 0 : _batchSize;
+ if (_query.commandName() == OpMsgMessage::CMD_FIND)
+ {
+ _query.body().add("batchSize", bsize);
+ }
+ else if (_query.commandName() == OpMsgMessage::CMD_AGGREGATE)
+ {
+ auto& cursorDoc = _query.body().addNewDocument("cursor");
+ cursorDoc.add("batchSize", bsize);
+ }
+ }
+
+ connection.sendRequest(_query, _response);
+
+ const auto& rdoc = _response.body();
+ _cursorID = cursorIdFromResponse(rdoc);
+ }
+ else
+ {
+#if MONGODB_EXHAUST_ALLOWED_WORKS
+ std::cout << "Response flags: " << _response.flags() << std::endl;
+ if (_response.flags() & OpMsgMessage::MSG_MORE_TO_COME)
+ {
+ std::cout << "More to come. Reading more response: " << std::endl;
+ _response.clear();
+ connection.readResponse(_response);
+ }
+ else
+#endif
+ {
+ _response.clear();
+ _query.setCursor(_cursorID, _batchSize);
+ connection.sendRequest(_query, _response);
+ }
+ }
+
+ const auto& rdoc = _response.body();
+ _cursorID = cursorIdFromResponse(rdoc);
+
+ return _response;
+}
+
+
+void OpMsgCursor::kill(Connection& connection)
+{
+ _response.clear();
+ if (_cursorID != 0)
+ {
+ _query.setCommandName(OpMsgMessage::CMD_KILL_CURSORS);
+
+ MongoDB::Array::Ptr cursors = new MongoDB::Array();
+ cursors->add(_cursorID);
+ _query.body().add("cursors", cursors);
+
+ connection.sendRequest(_query, _response);
+
+ const auto killed = _response.body().get<MongoDB::Array::Ptr>("cursorsKilled", nullptr);
+ if (!killed || killed->size() != 1 || killed->get<Poco::Int64>(0, -1) != _cursorID)
+ {
+ throw Poco::ProtocolException("Cursor not killed as expected: " + std::to_string(_cursorID));
+ }
+
+ _cursorID = 0;
+ _query.clear();
+ _response.clear();
+ }
+}
+
+
+Poco::Int64 cursorIdFromResponse(const MongoDB::Document& doc)
+{
+ Poco::Int64 id {0};
+ auto cursorDoc = doc.get<Document::Ptr>(keyCursor, nullptr);
+ if(cursorDoc)
+ {
+ id = cursorDoc->get<Poco::Int64>("id", 0);
+ }
+ return id;
+}
+
+
+} } // Namespace Poco::MongoDB
diff --git a/base/poco/MongoDB/src/OpMsgMessage.cpp b/base/poco/MongoDB/src/OpMsgMessage.cpp
new file mode 100644
index 00000000000..2b55772ca59
--- /dev/null
+++ b/base/poco/MongoDB/src/OpMsgMessage.cpp
@@ -0,0 +1,412 @@
+//
+// OpMsgMessage.cpp
+//
+// Library: MongoDB
+// Package: MongoDB
+// Module: OpMsgMessage
+//
+// Copyright (c) 2022, Applied Informatics Software Engineering GmbH.
+// and Contributors.
+//
+// SPDX-License-Identifier: BSL-1.0
+//
+
+#include "Poco/MongoDB/OpMsgMessage.h"
+#include "Poco/MongoDB/MessageHeader.h"
+#include "Poco/MongoDB/Array.h"
+#include "Poco/StreamCopier.h"
+#include "Poco/Logger.h"
+
+#define POCO_MONGODB_DUMP false
+
+namespace Poco {
+namespace MongoDB {
+
+// Query and write
+const std::string OpMsgMessage::CMD_INSERT { "insert" };
+const std::string OpMsgMessage::CMD_DELETE { "delete" };
+const std::string OpMsgMessage::CMD_UPDATE { "update" };
+const std::string OpMsgMessage::CMD_FIND { "find" };
+const std::string OpMsgMessage::CMD_FIND_AND_MODIFY { "findAndModify" };
+const std::string OpMsgMessage::CMD_GET_MORE { "getMore" };
+
+// Aggregation
+const std::string OpMsgMessage::CMD_AGGREGATE { "aggregate" };
+const std::string OpMsgMessage::CMD_COUNT { "count" };
+const std::string OpMsgMessage::CMD_DISTINCT { "distinct" };
+const std::string OpMsgMessage::CMD_MAP_REDUCE { "mapReduce" };
+
+// Replication and administration
+const std::string OpMsgMessage::CMD_HELLO { "hello" };
+const std::string OpMsgMessage::CMD_REPL_SET_GET_STATUS { "replSetGetStatus" };
+const std::string OpMsgMessage::CMD_REPL_SET_GET_CONFIG { "replSetGetConfig" };
+
+const std::string OpMsgMessage::CMD_CREATE { "create" };
+const std::string OpMsgMessage::CMD_CREATE_INDEXES { "createIndexes" };
+const std::string OpMsgMessage::CMD_DROP { "drop" };
+const std::string OpMsgMessage::CMD_DROP_DATABASE { "dropDatabase" };
+const std::string OpMsgMessage::CMD_KILL_CURSORS { "killCursors" };
+const std::string OpMsgMessage::CMD_LIST_DATABASES { "listDatabases" };
+const std::string OpMsgMessage::CMD_LIST_INDEXES { "listIndexes" };
+
+// Diagnostic
+const std::string OpMsgMessage::CMD_BUILD_INFO { "buildInfo" };
+const std::string OpMsgMessage::CMD_COLL_STATS { "collStats" };
+const std::string OpMsgMessage::CMD_DB_STATS { "dbStats" };
+const std::string OpMsgMessage::CMD_HOST_INFO { "hostInfo" };
+
+
+static const std::string& commandIdentifier(const std::string& command);
+ /// Commands have different names for the payload that is sent in a separate section
+
+
+static const std::string keyCursor {"cursor"};
+static const std::string keyFirstBatch {"firstBatch"};
+static const std::string keyNextBatch {"nextBatch"};
+
+
+OpMsgMessage::OpMsgMessage() :
+ Message(MessageHeader::OP_MSG)
+{
+}
+
+
+OpMsgMessage::OpMsgMessage(const std::string& databaseName, const std::string& collectionName, UInt32 flags) :
+ Message(MessageHeader::OP_MSG),
+ _databaseName(databaseName),
+ _collectionName(collectionName),
+ _flags(flags)
+{
+}
+
+
+OpMsgMessage::~OpMsgMessage()
+{
+}
+
+const std::string& OpMsgMessage::databaseName() const
+{
+ return _databaseName;
+}
+
+
+const std::string& OpMsgMessage::collectionName() const
+{
+ return _collectionName;
+}
+
+
+void OpMsgMessage::setCommandName(const std::string& command)
+{
+ _commandName = command;
+ _body.clear();
+
+ // IMPORTANT: Command name must be first
+ if (_collectionName.empty())
+ {
+ // Collection is not specified. It is assumed that this particular command does
+ // not need it.
+ _body.add(_commandName, Int32(1));
+ }
+ else
+ {
+ _body.add(_commandName, _collectionName);
+ }
+ _body.add("$db", _databaseName);
+}
+
+
+void OpMsgMessage::setCursor(Poco::Int64 cursorID, Poco::Int32 batchSize)
+{
+ _commandName = OpMsgMessage::CMD_GET_MORE;
+ _body.clear();
+
+ // IMPORTANT: Command name must be first
+ _body.add(_commandName, cursorID);
+ _body.add("$db", _databaseName);
+ _body.add("collection", _collectionName);
+ if (batchSize > 0)
+ {
+ _body.add("batchSize", batchSize);
+ }
+}
+
+
+const std::string& OpMsgMessage::commandName() const
+{
+ return _commandName;
+}
+
+
+void OpMsgMessage::setAcknowledgedRequest(bool ack)
+{
+ const auto& id = commandIdentifier(_commandName);
+ if (id.empty())
+ return;
+
+ _acknowledged = ack;
+
+ auto writeConcern = _body.get<Document::Ptr>("writeConcern", nullptr);
+ if (writeConcern)
+ writeConcern->remove("w");
+
+ if (ack)
+ {
+ _flags = _flags & (~MSG_MORE_TO_COME);
+ }
+ else
+ {
+ _flags = _flags | MSG_MORE_TO_COME;
+ if (!writeConcern)
+ _body.addNewDocument("writeConcern").add("w", 0);
+ else
+ writeConcern->add("w", 0);
+ }
+
+}
+
+
+bool OpMsgMessage::acknowledgedRequest() const
+{
+ return _acknowledged;
+}
+
+
+UInt32 OpMsgMessage::flags() const
+{
+ return _flags;
+}
+
+
+Document& OpMsgMessage::body()
+{
+ return _body;
+}
+
+
+const Document& OpMsgMessage::body() const
+{
+ return _body;
+}
+
+
+Document::Vector& OpMsgMessage::documents()
+{
+ return _documents;
+}
+
+
+const Document::Vector& OpMsgMessage::documents() const
+{
+ return _documents;
+}
+
+
+bool OpMsgMessage::responseOk() const
+{
+ Poco::Int64 ok {false};
+ if (_body.exists("ok"))
+ {
+ ok = _body.getInteger("ok");
+ }
+ return (ok != 0);
+}
+
+
+void OpMsgMessage::clear()
+{
+ _flags = MSG_FLAGS_DEFAULT;
+ _commandName.clear();
+ _body.clear();
+ _documents.clear();
+}
+
+
+void OpMsgMessage::send(std::ostream& ostr)
+{
+ BinaryWriter socketWriter(ostr, BinaryWriter::LITTLE_ENDIAN_BYTE_ORDER);
+
+ // Serialise the body
+ std::stringstream ss;
+ BinaryWriter writer(ss, BinaryWriter::LITTLE_ENDIAN_BYTE_ORDER);
+ writer << _flags;
+
+ writer << PAYLOAD_TYPE_0;
+ _body.write(writer);
+
+ if (!_documents.empty())
+ {
+ // Serialise attached documents
+
+ std::stringstream ssdoc;
+ BinaryWriter wdoc(ssdoc, BinaryWriter::LITTLE_ENDIAN_BYTE_ORDER);
+ for (auto& doc: _documents)
+ {
+ doc->write(wdoc);
+ }
+ wdoc.flush();
+
+ const std::string& identifier = commandIdentifier(_commandName);
+ const Poco::Int32 size = static_cast<Poco::Int32>(sizeof(size) + identifier.size() + 1 + ssdoc.tellp());
+ writer << PAYLOAD_TYPE_1;
+ writer << size;
+ writer.writeCString(identifier.c_str());
+ StreamCopier::copyStream(ssdoc, ss);
+ }
+ writer.flush();
+
+#if POCO_MONGODB_DUMP
+ const std::string section = ss.str();
+ std::string dump;
+ Logger::formatDump(dump, section.data(), section.length());
+ std::cout << dump << std::endl;
+#endif
+
+ messageLength(static_cast<Poco::Int32>(ss.tellp()));
+
+ _header.write(socketWriter);
+ StreamCopier::copyStream(ss, ostr);
+
+ ostr.flush();
+}
+
+
+void OpMsgMessage::read(std::istream& istr)
+{
+ std::string message;
+ {
+ BinaryReader reader(istr, BinaryReader::LITTLE_ENDIAN_BYTE_ORDER);
+ _header.read(reader);
+
+ poco_assert_dbg(_header.opCode() == _header.OP_MSG);
+
+ const std::streamsize remainingSize {_header.getMessageLength() - _header.MSG_HEADER_SIZE };
+ message.reserve(remainingSize);
+
+#if POCO_MONGODB_DUMP
+ std::cout
+ << "Message hdr: " << _header.getMessageLength() << " " << remainingSize << " "
+ << _header.opCode() << " " << _header.getRequestID() << " " << _header.responseTo()
+ << std::endl;
+#endif
+
+ reader.readRaw(remainingSize, message);
+
+#if POCO_MONGODB_DUMP
+ std::string dump;
+ Logger::formatDump(dump, message.data(), message.length());
+ std::cout << dump << std::endl;
+#endif
+ }
+ // Read complete message and then interpret it.
+
+ std::istringstream msgss(message);
+ BinaryReader reader(msgss, BinaryReader::LITTLE_ENDIAN_BYTE_ORDER);
+
+ Poco::UInt8 payloadType {0xFF};
+
+ reader >> _flags;
+ reader >> payloadType;
+ poco_assert_dbg(payloadType == PAYLOAD_TYPE_0);
+
+ _body.read(reader);
+
+ // Read next sections from the buffer
+ while (msgss.good())
+ {
+ // NOTE: Not tested yet with database, because it returns everything in the body.
+ // Does MongoDB ever return documents as Payload type 1?
+ reader >> payloadType;
+ if (!msgss.good())
+ {
+ break;
+ }
+ poco_assert_dbg(payloadType == PAYLOAD_TYPE_1);
+#if POCO_MONGODB_DUMP
+ std::cout << "section payload: " << payloadType << std::endl;
+#endif
+
+ Poco::Int32 sectionSize {0};
+ reader >> sectionSize;
+ poco_assert_dbg(sectionSize > 0);
+
+#if POCO_MONGODB_DUMP
+ std::cout << "section size: " << sectionSize << std::endl;
+#endif
+ std::streamoff offset = sectionSize - sizeof(sectionSize);
+ std::streampos endOfSection = msgss.tellg() + offset;
+
+ std::string identifier;
+ reader.readCString(identifier);
+#if POCO_MONGODB_DUMP
+ std::cout << "section identifier: " << identifier << std::endl;
+#endif
+
+ // Loop to read documents from this section.
+ while (msgss.tellg() < endOfSection)
+ {
+#if POCO_MONGODB_DUMP
+ std::cout << "section doc: " << msgss.tellg() << " " << endOfSection << std::endl;
+#endif
+ Document::Ptr doc = new Document();
+ doc->read(reader);
+ _documents.push_back(doc);
+ if (msgss.tellg() < 0)
+ {
+ break;
+ }
+ }
+ }
+
+ // Extract documents from the cursor batch if they are there.
+ MongoDB::Array::Ptr batch;
+ auto curDoc = _body.get<Document::Ptr>(keyCursor, nullptr);
+ if (curDoc)
+ {
+ batch = curDoc->get<MongoDB::Array::Ptr>(keyFirstBatch, nullptr);
+ if (!batch)
+ {
+ batch = curDoc->get<MongoDB::Array::Ptr>(keyNextBatch, nullptr);
+ }
+ }
+ if (batch)
+ {
+ for(std::size_t i = 0; i < batch->size(); i++)
+ {
+ const auto& d = batch->get<Document::Ptr>(i, nullptr);
+ if (d)
+ {
+ _documents.push_back(d);
+ }
+ }
+ }
+
+}
+
+const std::string& commandIdentifier(const std::string& command)
+{
+ // Names of identifiers for commands that send bulk documents in the request
+ // The identifier is set in the section type 1.
+ static std::map<std::string, std::string> identifiers {
+ { OpMsgMessage::CMD_INSERT, "documents" },
+ { OpMsgMessage::CMD_DELETE, "deletes" },
+ { OpMsgMessage::CMD_UPDATE, "updates" },
+
+ // Not sure if create index can send document section
+ { OpMsgMessage::CMD_CREATE_INDEXES, "indexes" }
+ };
+
+ const auto i = identifiers.find(command);
+ if (i != identifiers.end())
+ {
+ return i->second;
+ }
+
+ // This likely means that documents are incorrectly set for a command
+ // that does not send list of documents in section type 1.
+ static const std::string emptyIdentifier;
+ return emptyIdentifier;
+}
+
+
+} } // namespace Poco::MongoDB
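send() frames the message as a 16-byte MessageHeader, a UInt32 flagBits word, a type-0 section carrying the body, and optionally a type-1 section carrying bulk documents under the command's identifier. The framing can be inspected offline by serializing into a stringstream; a sketch (not part of the patch, no server required):

#include <iomanip>
#include <iostream>
#include <sstream>
#include "Poco/MongoDB/OpMsgMessage.h"

int main()
{
    Poco::MongoDB::OpMsgMessage msg("test", "people");
    msg.setCommandName(Poco::MongoDB::OpMsgMessage::CMD_FIND);

    std::stringstream ss;
    msg.send(ss);

    const std::string bytes = ss.str();
    std::cout << "total length: " << bytes.size() << '\n';
    // The first 16 bytes are the header: messageLength, requestID,
    // responseTo and opCode (2013 for OP_MSG), all little-endian Int32.
    for (unsigned char c : bytes.substr(0, 16))
        std::cout << std::hex << std::setw(2) << std::setfill('0') << int(c) << ' ';
    std::cout << '\n';
    return 0;
}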
diff --git a/base/poco/MongoDB/src/QueryRequest.cpp b/base/poco/MongoDB/src/QueryRequest.cpp
index 7044335ba30..6d7d23a8456 100644
--- a/base/poco/MongoDB/src/QueryRequest.cpp
+++ b/base/poco/MongoDB/src/QueryRequest.cpp
@@ -20,10 +20,10 @@ namespace MongoDB {
QueryRequest::QueryRequest(const std::string& collectionName, QueryRequest::Flags flags):
- RequestMessage(MessageHeader::OP_QUERY),
- _flags(flags),
+ RequestMessage(MessageHeader::OP_QUERY),
+ _flags(flags),
_fullCollectionName(collectionName),
- _numberToSkip(0),
+ _numberToSkip(0),
_numberToReturn(100),
_selector(),
_returnFieldSelector()
diff --git a/base/poco/MongoDB/src/RegularExpression.cpp b/base/poco/MongoDB/src/RegularExpression.cpp
index e95e7da82e1..5f7eb6bb51b 100644
--- a/base/poco/MongoDB/src/RegularExpression.cpp
+++ b/base/poco/MongoDB/src/RegularExpression.cpp
@@ -25,8 +25,8 @@ RegularExpression::RegularExpression()
}
-RegularExpression::RegularExpression(const std::string& pattern, const std::string& options):
- _pattern(pattern),
+RegularExpression::RegularExpression(const std::string& pattern, const std::string& options):
+ _pattern(pattern),
_options(options)
{
}
diff --git a/base/poco/MongoDB/src/ReplicaSet.cpp b/base/poco/MongoDB/src/ReplicaSet.cpp
index b56fea49311..fce2f2bdada 100644
--- a/base/poco/MongoDB/src/ReplicaSet.cpp
+++ b/base/poco/MongoDB/src/ReplicaSet.cpp
@@ -21,7 +21,7 @@ namespace Poco {
namespace MongoDB {
-ReplicaSet::ReplicaSet(const std::vector<Net::SocketAddress> &addresses):
+ReplicaSet::ReplicaSet(const std::vector<Net::SocketAddress> &addresses):
_addresses(addresses)
{
}
@@ -81,8 +81,8 @@ Connection::Ptr ReplicaSet::isMaster(const Net::SocketAddress& address)
{
conn = 0;
}
-
- return 0;
+
+ return 0;
}
diff --git a/base/poco/MongoDB/src/RequestMessage.cpp b/base/poco/MongoDB/src/RequestMessage.cpp
index 6391d966198..999ed8a6ba1 100644
--- a/base/poco/MongoDB/src/RequestMessage.cpp
+++ b/base/poco/MongoDB/src/RequestMessage.cpp
@@ -21,7 +21,7 @@ namespace Poco {
namespace MongoDB {
-RequestMessage::RequestMessage(MessageHeader::OpCode opcode):
+RequestMessage::RequestMessage(MessageHeader::OpCode opcode):
Message(opcode)
{
}
@@ -35,7 +35,7 @@ RequestMessage::~RequestMessage()
void RequestMessage::send(std::ostream& ostr)
{
std::stringstream ss;
- BinaryWriter requestWriter(ss);
+ BinaryWriter requestWriter(ss, BinaryWriter::LITTLE_ENDIAN_BYTE_ORDER);
buildRequest(requestWriter);
requestWriter.flush();
diff --git a/base/poco/MongoDB/src/ResponseMessage.cpp b/base/poco/MongoDB/src/ResponseMessage.cpp
index 3254ace63e6..e8216767494 100644
--- a/base/poco/MongoDB/src/ResponseMessage.cpp
+++ b/base/poco/MongoDB/src/ResponseMessage.cpp
@@ -21,10 +21,20 @@ namespace MongoDB {
ResponseMessage::ResponseMessage():
- Message(MessageHeader::OP_REPLY),
- _responseFlags(0),
- _cursorID(0),
- _startingFrom(0),
+ Message(MessageHeader::OP_REPLY),
+ _responseFlags(0),
+ _cursorID(0),
+ _startingFrom(0),
+ _numberReturned(0)
+{
+}
+
+
+ResponseMessage::ResponseMessage(const Int64& cursorID):
+ Message(MessageHeader::OP_REPLY),
+ _responseFlags(0),
+ _cursorID(cursorID),
+ _startingFrom(0),
_numberReturned(0)
{
}
@@ -50,7 +60,7 @@ void ResponseMessage::read(std::istream& istr)
clear();
BinaryReader reader(istr, BinaryReader::LITTLE_ENDIAN_BYTE_ORDER);
-
+
_header.read(reader);
reader >> _responseFlags;
diff --git a/base/poco/MongoDB/src/UpdateRequest.cpp b/base/poco/MongoDB/src/UpdateRequest.cpp
index 2af4621ff64..7477fc752d5 100644
--- a/base/poco/MongoDB/src/UpdateRequest.cpp
+++ b/base/poco/MongoDB/src/UpdateRequest.cpp
@@ -20,7 +20,7 @@ namespace MongoDB {
UpdateRequest::UpdateRequest(const std::string& collectionName, UpdateRequest::Flags flags):
- RequestMessage(MessageHeader::OP_UPDATE),
+ RequestMessage(MessageHeader::OP_UPDATE),
_flags(flags),
_fullCollectionName(collectionName),
_selector(),
diff --git a/base/poco/Net/include/Poco/Net/HTTPBasicStreamBuf.h b/base/poco/Net/include/Poco/Net/HTTPBasicStreamBuf.h
index c4872d95353..c87719b63a4 100644
--- a/base/poco/Net/include/Poco/Net/HTTPBasicStreamBuf.h
+++ b/base/poco/Net/include/Poco/Net/HTTPBasicStreamBuf.h
@@ -19,7 +19,6 @@
#include "Poco/BufferedStreamBuf.h"
-#include "Poco/Net/HTTPBufferAllocator.h"
#include "Poco/Net/Net.h"
@@ -27,9 +26,9 @@ namespace Poco
{
namespace Net
{
+ constexpr size_t HTTP_DEFAULT_BUFFER_SIZE = 8 * 1024;
-
- typedef Poco::BasicBufferedStreamBuf<char, std::char_traits<char>, HTTPBufferAllocator> HTTPBasicStreamBuf;
+ typedef Poco::BasicBufferedStreamBuf<char, std::char_traits<char>> HTTPBasicStreamBuf;
}
diff --git a/base/poco/Net/include/Poco/Net/HTTPBufferAllocator.h b/base/poco/Net/include/Poco/Net/HTTPBufferAllocator.h
deleted file mode 100644
index 5d088e35297..00000000000
--- a/base/poco/Net/include/Poco/Net/HTTPBufferAllocator.h
+++ /dev/null
@@ -1,53 +0,0 @@
-//
-// HTTPBufferAllocator.h
-//
-// Library: Net
-// Package: HTTP
-// Module: HTTPBufferAllocator
-//
-// Definition of the HTTPBufferAllocator class.
-//
-// Copyright (c) 2005-2006, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#ifndef Net_HTTPBufferAllocator_INCLUDED
-#define Net_HTTPBufferAllocator_INCLUDED
-
-
-#include <ios>
-#include "Poco/MemoryPool.h"
-#include "Poco/Net/Net.h"
-
-
-namespace Poco
-{
-namespace Net
-{
-
-
- class Net_API HTTPBufferAllocator
- /// A BufferAllocator for HTTP streams.
- {
- public:
- static char * allocate(std::streamsize size);
- static void deallocate(char * ptr, std::streamsize size);
-
- enum
- {
- BUFFER_SIZE = 128 * 1024
- };
-
- private:
- static Poco::MemoryPool _pool;
- };
-
-
-}
-} // namespace Poco::Net
-
-
-#endif // Net_HTTPBufferAllocator_INCLUDED
diff --git a/base/poco/Net/include/Poco/Net/HTTPChunkedStream.h b/base/poco/Net/include/Poco/Net/HTTPChunkedStream.h
index 47987b18817..5f4729c9278 100644
--- a/base/poco/Net/include/Poco/Net/HTTPChunkedStream.h
+++ b/base/poco/Net/include/Poco/Net/HTTPChunkedStream.h
@@ -21,7 +21,6 @@
#include <cstdlib>
#include <istream>
#include <ostream>
-#include "Poco/MemoryPool.h"
#include "Poco/Net/HTTPBasicStreamBuf.h"
#include "Poco/Net/Net.h"
@@ -80,12 +79,6 @@ namespace Net
public:
HTTPChunkedInputStream(HTTPSession & session);
~HTTPChunkedInputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
@@ -95,12 +88,6 @@ namespace Net
public:
HTTPChunkedOutputStream(HTTPSession & session);
~HTTPChunkedOutputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
diff --git a/base/poco/Net/include/Poco/Net/HTTPClientSession.h b/base/poco/Net/include/Poco/Net/HTTPClientSession.h
index 6f67918d2c8..d495d662f75 100644
--- a/base/poco/Net/include/Poco/Net/HTTPClientSession.h
+++ b/base/poco/Net/include/Poco/Net/HTTPClientSession.h
@@ -127,6 +127,9 @@ namespace Net
void setResolvedHost(std::string resolved_host) { _resolved_host.swap(resolved_host); }
+ std::string getResolvedHost() const { return _resolved_host; }
+ /// Returns the resolved IP address of the target HTTP server.
+
Poco::UInt16 getPort() const;
/// Returns the port number of the target HTTP server.
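
A short usage sketch for the new getter (hypothetical logging helper; `getHost()` is the existing Poco accessor):

```cpp
#include "Poco/Net/HTTPClientSession.h"
#include <iostream>

// The new getter exposes the address stored via setResolvedHost(), useful
// for example to log which IP a session actually talks to.
void logTarget(Poco::Net::HTTPClientSession & session)
{
    std::cout << session.getHost() << " resolved to " << session.getResolvedHost() << '\n';
}
```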
diff --git a/base/poco/Net/include/Poco/Net/HTTPFixedLengthStream.h b/base/poco/Net/include/Poco/Net/HTTPFixedLengthStream.h
index 4de211fdb92..2f4df102605 100644
--- a/base/poco/Net/include/Poco/Net/HTTPFixedLengthStream.h
+++ b/base/poco/Net/include/Poco/Net/HTTPFixedLengthStream.h
@@ -78,12 +78,6 @@ namespace Net
public:
HTTPFixedLengthInputStream(HTTPSession & session, HTTPFixedLengthStreamBuf::ContentLength length);
~HTTPFixedLengthInputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
@@ -93,12 +87,6 @@ namespace Net
public:
HTTPFixedLengthOutputStream(HTTPSession & session, HTTPFixedLengthStreamBuf::ContentLength length);
~HTTPFixedLengthOutputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
diff --git a/base/poco/Net/include/Poco/Net/HTTPHeaderStream.h b/base/poco/Net/include/Poco/Net/HTTPHeaderStream.h
index bcfca984d8b..cf1a6dba2e6 100644
--- a/base/poco/Net/include/Poco/Net/HTTPHeaderStream.h
+++ b/base/poco/Net/include/Poco/Net/HTTPHeaderStream.h
@@ -21,7 +21,6 @@
#include <cstddef>
#include <istream>
#include <ostream>
-#include "Poco/MemoryPool.h"
#include "Poco/Net/HTTPBasicStreamBuf.h"
#include "Poco/Net/Net.h"
@@ -74,12 +73,6 @@ namespace Net
public:
HTTPHeaderInputStream(HTTPSession & session);
~HTTPHeaderInputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
@@ -89,12 +82,6 @@ namespace Net
public:
HTTPHeaderOutputStream(HTTPSession & session);
~HTTPHeaderOutputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
diff --git a/base/poco/Net/include/Poco/Net/HTTPSession.h b/base/poco/Net/include/Poco/Net/HTTPSession.h
index d0045025f5f..934b34be5d5 100644
--- a/base/poco/Net/include/Poco/Net/HTTPSession.h
+++ b/base/poco/Net/include/Poco/Net/HTTPSession.h
@@ -192,7 +192,7 @@ namespace Net
HTTPSession & operator=(const HTTPSession &);
StreamSocket _socket;
- char * _pBuffer;
+ std::unique_ptr<char[]> _pBuffer;
char * _pCurrent;
char * _pEnd;
bool _keepAlive;
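
Swapping the raw `char *` member for `std::unique_ptr<char[]>` is what lets the HTTPSession.cpp hunk further below drop the destructor's manual deallocate-and-catch block: the buffer now frees itself. A sketch of the resulting ownership, assuming the buffer is only ever heap-allocated:

```cpp
#include <memory>

// After the change: no custom destructor is needed, and the read cursors
// simply point into the owned buffer.
struct SessionAfter
{
    std::unique_ptr<char[]> buffer; // released automatically in ~SessionAfter()
    char * current = nullptr;       // points into buffer.get()
    char * end = nullptr;
};
```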
diff --git a/base/poco/Net/include/Poco/Net/HTTPStream.h b/base/poco/Net/include/Poco/Net/HTTPStream.h
index 0197bc62eb2..48502347b2c 100644
--- a/base/poco/Net/include/Poco/Net/HTTPStream.h
+++ b/base/poco/Net/include/Poco/Net/HTTPStream.h
@@ -21,7 +21,6 @@
#include <cstddef>
#include <istream>
#include <ostream>
-#include "Poco/MemoryPool.h"
#include "Poco/Net/HTTPBasicStreamBuf.h"
#include "Poco/Net/Net.h"
@@ -75,12 +74,6 @@ namespace Net
public:
HTTPInputStream(HTTPSession & session);
~HTTPInputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
@@ -90,12 +83,6 @@ namespace Net
public:
HTTPOutputStream(HTTPSession & session);
~HTTPOutputStream();
-
- void * operator new(std::size_t size);
- void operator delete(void * ptr);
-
- private:
- static Poco::MemoryPool _pool;
};
diff --git a/base/poco/Net/src/HTTPBufferAllocator.cpp b/base/poco/Net/src/HTTPBufferAllocator.cpp
deleted file mode 100644
index 2944e2a6121..00000000000
--- a/base/poco/Net/src/HTTPBufferAllocator.cpp
+++ /dev/null
@@ -1,44 +0,0 @@
-//
-// HTTPBufferAllocator.cpp
-//
-// Library: Net
-// Package: HTTP
-// Module: HTTPBufferAllocator
-//
-// Copyright (c) 2005-2006, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#include "Poco/Net/HTTPBufferAllocator.h"
-
-
-using Poco::MemoryPool;
-
-
-namespace Poco {
-namespace Net {
-
-
-MemoryPool HTTPBufferAllocator::_pool(HTTPBufferAllocator::BUFFER_SIZE, 16);
-
-
-char* HTTPBufferAllocator::allocate(std::streamsize size)
-{
- poco_assert_dbg (size == BUFFER_SIZE);
-
- return reinterpret_cast<char*>(_pool.get());
-}
-
-
-void HTTPBufferAllocator::deallocate(char* ptr, std::streamsize size)
-{
- poco_assert_dbg (size == BUFFER_SIZE);
-
- _pool.release(ptr);
-}
-
-
-} } // namespace Poco::Net
diff --git a/base/poco/Net/src/HTTPChunkedStream.cpp b/base/poco/Net/src/HTTPChunkedStream.cpp
index f2f79da590b..376e3f55492 100644
--- a/base/poco/Net/src/HTTPChunkedStream.cpp
+++ b/base/poco/Net/src/HTTPChunkedStream.cpp
@@ -34,7 +34,7 @@ namespace Net {
HTTPChunkedStreamBuf::HTTPChunkedStreamBuf(HTTPSession& session, openmode mode):
- HTTPBasicStreamBuf(HTTPBufferAllocator::BUFFER_SIZE, mode),
+ HTTPBasicStreamBuf(HTTP_DEFAULT_BUFFER_SIZE, mode),
_session(session),
_mode(mode),
_chunk(0)
@@ -181,10 +181,6 @@ HTTPChunkedStreamBuf* HTTPChunkedIOS::rdbuf()
// HTTPChunkedInputStream
//
-
-Poco::MemoryPool HTTPChunkedInputStream::_pool(sizeof(HTTPChunkedInputStream));
-
-
HTTPChunkedInputStream::HTTPChunkedInputStream(HTTPSession& session):
HTTPChunkedIOS(session, std::ios::in),
std::istream(&_buf)
@@ -196,34 +192,10 @@ HTTPChunkedInputStream::~HTTPChunkedInputStream()
{
}
-
-void* HTTPChunkedInputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPChunkedInputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
//
// HTTPChunkedOutputStream
//
-
-Poco::MemoryPool HTTPChunkedOutputStream::_pool(sizeof(HTTPChunkedOutputStream));
-
-
HTTPChunkedOutputStream::HTTPChunkedOutputStream(HTTPSession& session):
HTTPChunkedIOS(session, std::ios::out),
std::ostream(&_buf)
@@ -235,24 +207,4 @@ HTTPChunkedOutputStream::~HTTPChunkedOutputStream()
{
}
-
-void* HTTPChunkedOutputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPChunkedOutputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
} } // namespace Poco::Net
diff --git a/base/poco/Net/src/HTTPFixedLengthStream.cpp b/base/poco/Net/src/HTTPFixedLengthStream.cpp
index d19f6122ee1..fd77ff71cd9 100644
--- a/base/poco/Net/src/HTTPFixedLengthStream.cpp
+++ b/base/poco/Net/src/HTTPFixedLengthStream.cpp
@@ -30,7 +30,7 @@ namespace Net {
HTTPFixedLengthStreamBuf::HTTPFixedLengthStreamBuf(HTTPSession& session, ContentLength length, openmode mode):
- HTTPBasicStreamBuf(HTTPBufferAllocator::BUFFER_SIZE, mode),
+ HTTPBasicStreamBuf(HTTP_DEFAULT_BUFFER_SIZE, mode),
_session(session),
_length(length),
_count(0)
@@ -109,9 +109,6 @@ HTTPFixedLengthStreamBuf* HTTPFixedLengthIOS::rdbuf()
//
-Poco::MemoryPool HTTPFixedLengthInputStream::_pool(sizeof(HTTPFixedLengthInputStream));
-
-
HTTPFixedLengthInputStream::HTTPFixedLengthInputStream(HTTPSession& session, HTTPFixedLengthStreamBuf::ContentLength length):
HTTPFixedLengthIOS(session, length, std::ios::in),
std::istream(&_buf)
@@ -124,33 +121,10 @@ HTTPFixedLengthInputStream::~HTTPFixedLengthInputStream()
}
-void* HTTPFixedLengthInputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPFixedLengthInputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
//
// HTTPFixedLengthOutputStream
//
-
-Poco::MemoryPool HTTPFixedLengthOutputStream::_pool(sizeof(HTTPFixedLengthOutputStream));
-
-
HTTPFixedLengthOutputStream::HTTPFixedLengthOutputStream(HTTPSession& session, HTTPFixedLengthStreamBuf::ContentLength length):
HTTPFixedLengthIOS(session, length, std::ios::out),
std::ostream(&_buf)
@@ -163,23 +137,4 @@ HTTPFixedLengthOutputStream::~HTTPFixedLengthOutputStream()
}
-void* HTTPFixedLengthOutputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPFixedLengthOutputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
} } // namespace Poco::Net
diff --git a/base/poco/Net/src/HTTPHeaderStream.cpp b/base/poco/Net/src/HTTPHeaderStream.cpp
index 8e0091fcbe3..39b9007062d 100644
--- a/base/poco/Net/src/HTTPHeaderStream.cpp
+++ b/base/poco/Net/src/HTTPHeaderStream.cpp
@@ -26,7 +26,7 @@ namespace Net {
HTTPHeaderStreamBuf::HTTPHeaderStreamBuf(HTTPSession& session, openmode mode):
- HTTPBasicStreamBuf(HTTPBufferAllocator::BUFFER_SIZE, mode),
+ HTTPBasicStreamBuf(HTTP_DEFAULT_BUFFER_SIZE, mode),
_session(session),
_end(false)
{
@@ -101,10 +101,6 @@ HTTPHeaderStreamBuf* HTTPHeaderIOS::rdbuf()
// HTTPHeaderInputStream
//
-
-Poco::MemoryPool HTTPHeaderInputStream::_pool(sizeof(HTTPHeaderInputStream));
-
-
HTTPHeaderInputStream::HTTPHeaderInputStream(HTTPSession& session):
HTTPHeaderIOS(session, std::ios::in),
std::istream(&_buf)
@@ -116,34 +112,10 @@ HTTPHeaderInputStream::~HTTPHeaderInputStream()
{
}
-
-void* HTTPHeaderInputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPHeaderInputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
//
// HTTPHeaderOutputStream
//
-
-Poco::MemoryPool HTTPHeaderOutputStream::_pool(sizeof(HTTPHeaderOutputStream));
-
-
HTTPHeaderOutputStream::HTTPHeaderOutputStream(HTTPSession& session):
HTTPHeaderIOS(session, std::ios::out),
std::ostream(&_buf)
@@ -155,24 +127,4 @@ HTTPHeaderOutputStream::~HTTPHeaderOutputStream()
{
}
-
-void* HTTPHeaderOutputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPHeaderOutputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
} } // namespace Poco::Net
diff --git a/base/poco/Net/src/HTTPSession.cpp b/base/poco/Net/src/HTTPSession.cpp
index cb6fdc25e9a..d2663baaf9f 100644
--- a/base/poco/Net/src/HTTPSession.cpp
+++ b/base/poco/Net/src/HTTPSession.cpp
@@ -13,8 +13,8 @@
#include "Poco/Net/HTTPSession.h"
-#include "Poco/Net/HTTPBufferAllocator.h"
#include "Poco/Net/NetException.h"
+#include "Poco/Net/HTTPBasicStreamBuf.h"
#include <cstring>
@@ -68,14 +68,6 @@ HTTPSession::HTTPSession(const StreamSocket& socket, bool keepAlive):
HTTPSession::~HTTPSession()
{
- try
- {
- if (_pBuffer) HTTPBufferAllocator::deallocate(_pBuffer, HTTPBufferAllocator::BUFFER_SIZE);
- }
- catch (...)
- {
- poco_unexpected();
- }
try
{
close();
@@ -177,10 +169,10 @@ void HTTPSession::refill()
{
if (!_pBuffer)
{
- _pBuffer = HTTPBufferAllocator::allocate(HTTPBufferAllocator::BUFFER_SIZE);
+ _pBuffer = std::make_unique<char[]>(HTTP_DEFAULT_BUFFER_SIZE);
}
- _pCurrent = _pEnd = _pBuffer;
- int n = receive(_pBuffer, HTTPBufferAllocator::BUFFER_SIZE);
+ _pCurrent = _pEnd = _pBuffer.get();
+ int n = receive(_pBuffer.get(), HTTP_DEFAULT_BUFFER_SIZE);
_pEnd += n;
}
@@ -199,7 +191,7 @@ void HTTPSession::connect(const SocketAddress& address)
_socket.setNoDelay(true);
// There may be leftover data from a previous (failed) request in the buffer,
// so we clear it.
- _pCurrent = _pEnd = _pBuffer;
+ _pCurrent = _pEnd = _pBuffer.get();
}
diff --git a/base/poco/Net/src/HTTPStream.cpp b/base/poco/Net/src/HTTPStream.cpp
index 4acb881c4f3..c2f27600569 100644
--- a/base/poco/Net/src/HTTPStream.cpp
+++ b/base/poco/Net/src/HTTPStream.cpp
@@ -26,7 +26,7 @@ namespace Net {
HTTPStreamBuf::HTTPStreamBuf(HTTPSession& session, openmode mode):
- HTTPBasicStreamBuf(HTTPBufferAllocator::BUFFER_SIZE, mode),
+ HTTPBasicStreamBuf(HTTP_DEFAULT_BUFFER_SIZE, mode),
_session(session),
_mode(mode)
{
@@ -96,10 +96,6 @@ HTTPStreamBuf* HTTPIOS::rdbuf()
// HTTPInputStream
//
-
-Poco::MemoryPool HTTPInputStream::_pool(sizeof(HTTPInputStream));
-
-
HTTPInputStream::HTTPInputStream(HTTPSession& session):
HTTPIOS(session, std::ios::in),
std::istream(&_buf)
@@ -112,33 +108,11 @@ HTTPInputStream::~HTTPInputStream()
}
-void* HTTPInputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPInputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
//
// HTTPOutputStream
//
-Poco::MemoryPool HTTPOutputStream::_pool(sizeof(HTTPOutputStream));
-
-
HTTPOutputStream::HTTPOutputStream(HTTPSession& session):
HTTPIOS(session, std::ios::out),
std::ostream(&_buf)
@@ -150,24 +124,4 @@ HTTPOutputStream::~HTTPOutputStream()
{
}
-
-void* HTTPOutputStream::operator new(std::size_t size)
-{
- return _pool.get();
-}
-
-
-void HTTPOutputStream::operator delete(void* ptr)
-{
- try
- {
- _pool.release(ptr);
- }
- catch (...)
- {
- poco_unexpected();
- }
-}
-
-
} } // namespace Poco::Net
diff --git a/base/poco/Net/src/SocketImpl.cpp b/base/poco/Net/src/SocketImpl.cpp
index 2aba413b322..484b8cfeec3 100644
--- a/base/poco/Net/src/SocketImpl.cpp
+++ b/base/poco/Net/src/SocketImpl.cpp
@@ -274,7 +274,9 @@ void SocketImpl::shutdown()
int SocketImpl::sendBytes(const void* buffer, int length, int flags)
{
- if (_isBrokenTimeout)
+ bool blocking = _blocking && (flags & MSG_DONTWAIT) == 0;
+
+ if (_isBrokenTimeout && blocking)
{
if (_sndTimeout.totalMicroseconds() != 0)
{
@@ -289,11 +291,13 @@ int SocketImpl::sendBytes(const void* buffer, int length, int flags)
if (_sockfd == POCO_INVALID_SOCKET) throw InvalidSocketException();
rc = ::send(_sockfd, reinterpret_cast<const char*>(buffer), length, flags);
}
- while (_blocking && rc < 0 && lastError() == POCO_EINTR);
+ while (blocking && rc < 0 && lastError() == POCO_EINTR);
if (rc < 0)
{
int err = lastError();
- if (err == POCO_EAGAIN || err == POCO_ETIMEDOUT)
+ if ((err == POCO_EAGAIN || err == POCO_EWOULDBLOCK) && !blocking)
+ ;
+ else if (err == POCO_EAGAIN || err == POCO_ETIMEDOUT)
throw TimeoutException();
else
error(err);
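
The control flow above distinguishes a truly blocking send (socket in blocking mode and no MSG_DONTWAIT override) from a non-blocking one, so that EAGAIN/EWOULDBLOCK on a non-blocking send is reported to the caller rather than raised as a timeout. A hedged POSIX sketch of the same idea (plain C++ over the sockets API, not the Poco code):

```cpp
#include <sys/types.h>
#include <sys/socket.h>
#include <cerrno>

// Non-blocking send: a would-block condition is returned to the caller for
// retry instead of being treated as a timeout error.
ssize_t sendNonBlocking(int fd, const void * buf, size_t len, int flags)
{
    ssize_t rc = ::send(fd, buf, len, flags | MSG_DONTWAIT);
    if (rc < 0 && (errno == EAGAIN || errno == EWOULDBLOCK))
        return -1; // would block: caller should retry later
    return rc;     // bytes sent, or a genuine error for the caller to handle
}
```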
diff --git a/base/poco/NetSSL_OpenSSL/include/Poco/Net/ConsoleCertificateHandler.h b/base/poco/NetSSL_OpenSSL/include/Poco/Net/ConsoleCertificateHandler.h
deleted file mode 100644
index 8e09b6f18ae..00000000000
--- a/base/poco/NetSSL_OpenSSL/include/Poco/Net/ConsoleCertificateHandler.h
+++ /dev/null
@@ -1,53 +0,0 @@
-//
-// ConsoleCertificateHandler.h
-//
-// Library: NetSSL_OpenSSL
-// Package: SSLCore
-// Module: ConsoleCertificateHandler
-//
-// Definition of the ConsoleCertificateHandler class.
-//
-// Copyright (c) 2006-2009, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#ifndef NetSSL_ConsoleCertificateHandler_INCLUDED
-#define NetSSL_ConsoleCertificateHandler_INCLUDED
-
-
-#include "Poco/Net/InvalidCertificateHandler.h"
-#include "Poco/Net/NetSSL.h"
-
-
-namespace Poco
-{
-namespace Net
-{
-
-
- class NetSSL_API ConsoleCertificateHandler : public InvalidCertificateHandler
- /// A ConsoleCertificateHandler is invoked whenever an error occurs verifying the certificate.
- ///
- /// The certificate is printed to stdout and the user is asked via console if he wants to accept it.
- {
- public:
- ConsoleCertificateHandler(bool handleErrorsOnServerSide);
- /// Creates the ConsoleCertificateHandler.
-
- virtual ~ConsoleCertificateHandler();
- /// Destroys the ConsoleCertificateHandler.
-
- void onInvalidCertificate(const void * pSender, VerificationErrorArgs & errorCert);
- /// Prints the certificate to stdout and waits for user input on the console
- /// to decide if a certificate should be accepted/rejected.
- };
-
-
-}
-} // namespace Poco::Net
-
-
-#endif // NetSSL_ConsoleCertificateHandler_INCLUDED
diff --git a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SSLManager.h b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SSLManager.h
index a4fde26286e..21a1ed685e5 100644
--- a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SSLManager.h
+++ b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SSLManager.h
@@ -85,7 +85,7 @@ namespace Net
///         </options>
///     </privateKeyPassphraseHandler>
///     <invalidCertificateHandler>
- ///         <name>ConsoleCertificateHandler</name>
+ ///         <name>RejectCertificateHandler</name>
///     </invalidCertificateHandler>
///     <cacheSessions>true|false</cacheSessions>
///     <sessionIdContext>someString</sessionIdContext>
@@ -186,7 +186,7 @@ namespace Net
///
/// Valid initialization code would be:
/// SharedPtr<PrivateKeyPassphraseHandler> pConsoleHandler = new KeyConsoleHandler;
- /// SharedPtr<InvalidCertificateHandler> pInvalidCertHandler = new ConsoleCertificateHandler;
+ /// SharedPtr<InvalidCertificateHandler> pInvalidCertHandler = new RejectCertificateHandler;
/// Context::Ptr pContext = new Context(Context::SERVER_USE, "any.pem", "any.pem", "rootcert.pem", Context::VERIFY_RELAXED, 9, false, "ALL:!ADH:!LOW:!EXP:!MD5:@STRENGTH");
/// SSLManager::instance().initializeServer(pConsoleHandler, pInvalidCertHandler, pContext);
@@ -203,7 +203,7 @@ namespace Net
///
/// Valid initialization code would be:
/// SharedPtr<PrivateKeyPassphraseHandler> pConsoleHandler = new KeyConsoleHandler;
- /// SharedPtr<InvalidCertificateHandler> pInvalidCertHandler = new ConsoleCertificateHandler;
+ /// SharedPtr<InvalidCertificateHandler> pInvalidCertHandler = new RejectCertificateHandler;
/// Context::Ptr pContext = new Context(Context::CLIENT_USE, "", "", "rootcert.pem", Context::VERIFY_RELAXED, 9, false, "ALL:!ADH:!LOW:!EXP:!MD5:@STRENGTH");
/// SSLManager::instance().initializeClient(pConsoleHandler, pInvalidCertHandler, pContext);
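
Compilable form of the client-side initialization shown in the doc comment above, with the new default handler (file paths are placeholders):

```cpp
#include "Poco/Net/SSLManager.h"
#include "Poco/Net/KeyConsoleHandler.h"
#include "Poco/Net/RejectCertificateHandler.h"
#include "Poco/Net/Context.h"
#include "Poco/SharedPtr.h"

using namespace Poco::Net;
using Poco::SharedPtr;

// RejectCertificateHandler fails verification errors outright, which is the
// safe non-interactive replacement for the removed ConsoleCertificateHandler.
void initClientSSL()
{
    SharedPtr<PrivateKeyPassphraseHandler> pKeyHandler = new KeyConsoleHandler(false);
    SharedPtr<InvalidCertificateHandler> pCertHandler = new RejectCertificateHandler(false);
    Context::Ptr pContext = new Context(
        Context::CLIENT_USE, "", "", "rootcert.pem",
        Context::VERIFY_RELAXED, 9, false, "ALL:!ADH:!LOW:!EXP:!MD5:@STRENGTH");
    SSLManager::instance().initializeClient(pKeyHandler, pCertHandler, pContext);
}
```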
diff --git a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureSocketImpl.h b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureSocketImpl.h
index 56c550decfe..49c12b6b45f 100644
--- a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureSocketImpl.h
+++ b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureSocketImpl.h
@@ -183,6 +183,16 @@ namespace Net
/// Returns true iff a reused session was negotiated during
/// the handshake.
+ virtual void setBlocking(bool flag);
+ /// Sets the socket in blocking mode if flag is true,
+ /// disables blocking mode if flag is false.
+
+ virtual bool getBlocking() const;
+ /// Returns the blocking mode of the socket.
+ /// This method will only work if the blocking modes of
+ /// the socket are changed via the setBlocking method!
+
+
protected:
void acceptSSL();
/// Assume per-object mutex is locked.
diff --git a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureStreamSocketImpl.h b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureStreamSocketImpl.h
index b41043769fe..99e2130d673 100644
--- a/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureStreamSocketImpl.h
+++ b/base/poco/NetSSL_OpenSSL/include/Poco/Net/SecureStreamSocketImpl.h
@@ -201,6 +201,16 @@ namespace Net
/// Returns true iff a reused session was negotiated during
/// the handshake.
+ virtual void setBlocking(bool flag);
+ /// Sets the socket in blocking mode if flag is true,
+ /// disables blocking mode if flag is false.
+
+ virtual bool getBlocking() const;
+ /// Returns the blocking mode of the socket.
+ /// This method will only work if the blocking modes of
+ /// the socket are changed via the setBlocking method!
+
+
protected:
void acceptSSL();
/// Performs a SSL server-side handshake.
diff --git a/base/poco/NetSSL_OpenSSL/src/CertificateHandlerFactoryMgr.cpp b/base/poco/NetSSL_OpenSSL/src/CertificateHandlerFactoryMgr.cpp
index a89bbea11f2..f570e2d3599 100644
--- a/base/poco/NetSSL_OpenSSL/src/CertificateHandlerFactoryMgr.cpp
+++ b/base/poco/NetSSL_OpenSSL/src/CertificateHandlerFactoryMgr.cpp
@@ -13,7 +13,6 @@
#include "Poco/Net/CertificateHandlerFactoryMgr.h"
-#include "Poco/Net/ConsoleCertificateHandler.h"
#include "Poco/Net/AcceptCertificateHandler.h"
#include "Poco/Net/RejectCertificateHandler.h"
@@ -24,7 +23,6 @@ namespace Net {
CertificateHandlerFactoryMgr::CertificateHandlerFactoryMgr()
{
- setFactory("ConsoleCertificateHandler", new CertificateHandlerFactoryImpl());
setFactory("AcceptCertificateHandler", new CertificateHandlerFactoryImpl());
setFactory("RejectCertificateHandler", new CertificateHandlerFactoryImpl());
}
diff --git a/base/poco/NetSSL_OpenSSL/src/ConsoleCertificateHandler.cpp b/base/poco/NetSSL_OpenSSL/src/ConsoleCertificateHandler.cpp
deleted file mode 100644
index db64752e70c..00000000000
--- a/base/poco/NetSSL_OpenSSL/src/ConsoleCertificateHandler.cpp
+++ /dev/null
@@ -1,53 +0,0 @@
-//
-// ConsoleCertificateHandler.cpp
-//
-// Library: NetSSL_OpenSSL
-// Package: SSLCore
-// Module: ConsoleCertificateHandler
-//
-// Copyright (c) 2006-2009, Applied Informatics Software Engineering GmbH.
-// and Contributors.
-//
-// SPDX-License-Identifier: BSL-1.0
-//
-
-
-#include "Poco/Net/ConsoleCertificateHandler.h"
-#include <iostream>
-
-
-namespace Poco {
-namespace Net {
-
-
-ConsoleCertificateHandler::ConsoleCertificateHandler(bool server): InvalidCertificateHandler(server)
-{
-}
-
-
-ConsoleCertificateHandler::~ConsoleCertificateHandler()
-{
-}
-
-
-void ConsoleCertificateHandler::onInvalidCertificate(const void*, VerificationErrorArgs& errorCert)
-{
- const X509Certificate& aCert = errorCert.certificate();
- std::cout << "\n";
- std::cout << "WARNING: Certificate verification failed\n";
- std::cout << "----------------------------------------\n";
- std::cout << "Issuer Name: " << aCert.issuerName() << "\n";
- std::cout << "Subject Name: " << aCert.subjectName() << "\n\n";
- std::cout << "The certificate yielded the error: " << errorCert.errorMessage() << "\n\n";
- std::cout << "The error occurred in the certificate chain at position " << errorCert.errorDepth() << "\n";
- std::cout << "Accept the certificate (y,n)? ";
- char c = 0;
- std::cin >> c;
- if (c == 'y' || c == 'Y')
- errorCert.setIgnoreError(true);
- else
- errorCert.setIgnoreError(false);
-}
-
-
-} } // namespace Poco::Net
diff --git a/base/poco/NetSSL_OpenSSL/src/SSLManager.cpp b/base/poco/NetSSL_OpenSSL/src/SSLManager.cpp
index 82eed1a29eb..927602ca658 100644
--- a/base/poco/NetSSL_OpenSSL/src/SSLManager.cpp
+++ b/base/poco/NetSSL_OpenSSL/src/SSLManager.cpp
@@ -46,7 +46,7 @@ const std::string SSLManager::CFG_PREFER_SERVER_CIPHERS("preferServerCiphers");
const std::string SSLManager::CFG_DELEGATE_HANDLER("privateKeyPassphraseHandler.name");
const std::string SSLManager::VAL_DELEGATE_HANDLER("KeyConsoleHandler");
const std::string SSLManager::CFG_CERTIFICATE_HANDLER("invalidCertificateHandler.name");
-const std::string SSLManager::VAL_CERTIFICATE_HANDLER("ConsoleCertificateHandler");
+const std::string SSLManager::VAL_CERTIFICATE_HANDLER("RejectCertificateHandler");
const std::string SSLManager::CFG_SERVER_PREFIX("openSSL.server.");
const std::string SSLManager::CFG_CLIENT_PREFIX("openSSL.client.");
const std::string SSLManager::CFG_CACHE_SESSIONS("cacheSessions");
diff --git a/base/poco/NetSSL_OpenSSL/src/SecureSocketImpl.cpp b/base/poco/NetSSL_OpenSSL/src/SecureSocketImpl.cpp
index 9631c7a401a..efe25f65909 100644
--- a/base/poco/NetSSL_OpenSSL/src/SecureSocketImpl.cpp
+++ b/base/poco/NetSSL_OpenSSL/src/SecureSocketImpl.cpp
@@ -629,5 +629,15 @@ bool SecureSocketImpl::sessionWasReused()
return false;
}
+void SecureSocketImpl::setBlocking(bool flag)
+{
+ _pSocket->setBlocking(flag);
+}
+
+bool SecureSocketImpl::getBlocking() const
+{
+ return _pSocket->getBlocking();
+}
+
} } // namespace Poco::Net
diff --git a/base/poco/NetSSL_OpenSSL/src/SecureStreamSocketImpl.cpp b/base/poco/NetSSL_OpenSSL/src/SecureStreamSocketImpl.cpp
index aa1a96e1585..c00dd43b2ed 100644
--- a/base/poco/NetSSL_OpenSSL/src/SecureStreamSocketImpl.cpp
+++ b/base/poco/NetSSL_OpenSSL/src/SecureStreamSocketImpl.cpp
@@ -237,5 +237,15 @@ int SecureStreamSocketImpl::completeHandshake()
return _impl.completeHandshake();
}
+bool SecureStreamSocketImpl::getBlocking() const
+{
+ return _impl.getBlocking();
+}
+
+void SecureStreamSocketImpl::setBlocking(bool flag)
+{
+ _impl.setBlocking(flag);
+}
+
} } // namespace Poco::Net
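
Given the caveat in the header comments (getBlocking() only reflects changes made through setBlocking()), a hedged usage sketch on a secure socket:

```cpp
#include "Poco/Net/SecureStreamSocket.h"

// Toggle blocking mode through the socket API so the SSL implementation
// tracks it; per the header comment, getBlocking() is reliable only when
// the mode was changed via setBlocking().
void makeNonBlocking(Poco::Net::SecureStreamSocket & socket)
{
    socket.setBlocking(false);            // now recorded by SecureSocketImpl
    bool blocking = socket.getBlocking(); // false, reflecting the call above
    (void)blocking;
}
```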
diff --git a/cmake/autogenerated_versions.txt b/cmake/autogenerated_versions.txt
index 462529fbc13..821b7b46855 100644
--- a/cmake/autogenerated_versions.txt
+++ b/cmake/autogenerated_versions.txt
@@ -2,11 +2,11 @@
# NOTE: has nothing common with DBMS_TCP_PROTOCOL_VERSION,
# only DBMS_TCP_PROTOCOL_VERSION should be incremented on protocol changes.
-SET(VERSION_REVISION 54474)
+SET(VERSION_REVISION 54476)
SET(VERSION_MAJOR 23)
-SET(VERSION_MINOR 5)
+SET(VERSION_MINOR 7)
SET(VERSION_PATCH 1)
-SET(VERSION_GITHASH 3920eb987f7ed837ada5de8907284adf123f0583)
-SET(VERSION_DESCRIBE v23.5.1.1-testing)
-SET(VERSION_STRING 23.5.1.1)
+SET(VERSION_GITHASH d1c7e13d08868cb04d3562dcced704dd577cb1df)
+SET(VERSION_DESCRIBE v23.7.1.1-testing)
+SET(VERSION_STRING 23.7.1.1)
# end of autochange
diff --git a/cmake/toolchain/darwin-x86_64/README.txt b/cmake/toolchain/darwin-x86_64/README.txt
index 65c9aba5be6..90ada960bfa 100644
--- a/cmake/toolchain/darwin-x86_64/README.txt
+++ b/cmake/toolchain/darwin-x86_64/README.txt
@@ -1,2 +1,2 @@
-wget https://github.com/phracker/MacOSX-SDKs/releases/download/10.15/MacOSX10.15.sdk.tar.xz
-tar xJf MacOSX10.15.sdk.tar.xz --strip-components=1
+wget https://github.com/phracker/MacOSX-SDKs/releases/download/11.3/MacOSX11.0.sdk.tar.xz
+tar xJf MacOSX11.0.sdk.tar.xz --strip-components=1
diff --git a/contrib/CMakeLists.txt b/contrib/CMakeLists.txt
index 4a4ff9982ea..2af468970f1 100644
--- a/contrib/CMakeLists.txt
+++ b/contrib/CMakeLists.txt
@@ -146,7 +146,7 @@ add_contrib (amqpcpp-cmake AMQP-CPP) # requires: libuv
add_contrib (cassandra-cmake cassandra) # requires: libuv
if (NOT OS_DARWIN)
add_contrib (curl-cmake curl)
- add_contrib (azure-cmake azure)
+ add_contrib (azure-cmake azure) # requires: curl
add_contrib (sentry-native-cmake sentry-native) # requires: curl
endif()
add_contrib (fmtlib-cmake fmtlib)
@@ -157,7 +157,7 @@ add_contrib (librdkafka-cmake librdkafka) # requires: libgsasl
add_contrib (nats-io-cmake nats-io)
add_contrib (isa-l-cmake isa-l)
add_contrib (libhdfs3-cmake libhdfs3) # requires: google-protobuf, krb5, isa-l
-add_contrib (hive-metastore-cmake hive-metastore) # requires: thrift/avro/arrow/libhdfs3
+add_contrib (hive-metastore-cmake hive-metastore) # requires: thrift, avro, arrow, libhdfs3
add_contrib (cppkafka-cmake cppkafka)
add_contrib (libpqxx-cmake libpqxx)
add_contrib (libpq-cmake libpq)
diff --git a/contrib/NuRaft b/contrib/NuRaft
index b56784be1ae..491eaf592d9 160000
--- a/contrib/NuRaft
+++ b/contrib/NuRaft
@@ -1 +1 @@
-Subproject commit b56784be1aec568fb72aff47f281097c017623cb
+Subproject commit 491eaf592d950e0e37accbe8b3f217e068c9fecf
diff --git a/contrib/abseil-cpp-cmake/CMakeLists.txt b/contrib/abseil-cpp-cmake/CMakeLists.txt
index 4c31ecfc599..d64b6036611 100644
--- a/contrib/abseil-cpp-cmake/CMakeLists.txt
+++ b/contrib/abseil-cpp-cmake/CMakeLists.txt
@@ -17,3 +17,17 @@ get_target_property(FLAT_HASH_SET_INCLUDE_DIR absl::flat_hash_set INTERFACE_INCL
target_include_directories (_abseil_swiss_tables SYSTEM BEFORE INTERFACE ${FLAT_HASH_SET_INCLUDE_DIR})
add_library(ch_contrib::abseil_swiss_tables ALIAS _abseil_swiss_tables)
+
+set(ABSL_FORMAT_SRC
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/arg.cc
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/bind.cc
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/extension.cc
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/float_conversion.cc
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/output.cc
+ ${ABSL_ROOT_DIR}/absl/strings/internal/str_format/parser.cc
+)
+
+add_library(_abseil_str_format ${ABSL_FORMAT_SRC})
+target_include_directories(_abseil_str_format PUBLIC ${ABSL_ROOT_DIR})
+
+add_library(ch_contrib::abseil_str_format ALIAS _abseil_str_format)
diff --git a/contrib/arrow-cmake/CMakeLists.txt b/contrib/arrow-cmake/CMakeLists.txt
index 16198887075..46b86cb4ddb 100644
--- a/contrib/arrow-cmake/CMakeLists.txt
+++ b/contrib/arrow-cmake/CMakeLists.txt
@@ -31,12 +31,12 @@ endif()
set (CMAKE_CXX_STANDARD 17)
-set(ARROW_VERSION "6.0.1")
+set(ARROW_VERSION "11.0.0")
string(REGEX MATCH "^[0-9]+\\.[0-9]+\\.[0-9]+" ARROW_BASE_VERSION "${ARROW_VERSION}")
-set(ARROW_VERSION_MAJOR "6")
+set(ARROW_VERSION_MAJOR "11")
set(ARROW_VERSION_MINOR "0")
-set(ARROW_VERSION_PATCH "1")
+set(ARROW_VERSION_PATCH "0")
if(ARROW_VERSION_MAJOR STREQUAL "0")
# Arrow 0.x.y => SO version is "x", full SO version is "x.y.0"
@@ -116,43 +116,79 @@ configure_file("${ORC_SOURCE_SRC_DIR}/Adaptor.hh.in" "${ORC_BUILD_INCLUDE_DIR}/A
# ARROW_ORC + adapters/orc/CMakefiles
set(ORC_SRCS
"${CMAKE_CURRENT_BINARY_DIR}/orc_proto.pb.h"
- "${ORC_SOURCE_SRC_DIR}/sargs/ExpressionTree.cc"
- "${ORC_SOURCE_SRC_DIR}/sargs/Literal.cc"
- "${ORC_SOURCE_SRC_DIR}/sargs/PredicateLeaf.cc"
- "${ORC_SOURCE_SRC_DIR}/sargs/SargsApplier.cc"
- "${ORC_SOURCE_SRC_DIR}/sargs/SearchArgument.cc"
- "${ORC_SOURCE_SRC_DIR}/sargs/TruthValue.cc"
- "${ORC_SOURCE_SRC_DIR}/Exceptions.cc"
- "${ORC_SOURCE_SRC_DIR}/OrcFile.cc"
- "${ORC_SOURCE_SRC_DIR}/Reader.cc"
+ "${ORC_ADDITION_SOURCE_DIR}/orc_proto.pb.cc"
+ "${ORC_SOURCE_SRC_DIR}/Adaptor.cc"
+ "${ORC_SOURCE_SRC_DIR}/Adaptor.hh.in"
+ "${ORC_SOURCE_SRC_DIR}/BlockBuffer.cc"
+ "${ORC_SOURCE_SRC_DIR}/BlockBuffer.hh"
+ "${ORC_SOURCE_SRC_DIR}/BloomFilter.cc"
+ "${ORC_SOURCE_SRC_DIR}/BloomFilter.hh"
+ "${ORC_SOURCE_SRC_DIR}/Bpacking.hh"
+ "${ORC_SOURCE_SRC_DIR}/BpackingDefault.cc"
+ "${ORC_SOURCE_SRC_DIR}/BpackingDefault.hh"
"${ORC_SOURCE_SRC_DIR}/ByteRLE.cc"
+ "${ORC_SOURCE_SRC_DIR}/ByteRLE.hh"
+ "${ORC_SOURCE_SRC_DIR}/CMakeLists.txt"
"${ORC_SOURCE_SRC_DIR}/ColumnPrinter.cc"
"${ORC_SOURCE_SRC_DIR}/ColumnReader.cc"
+ "${ORC_SOURCE_SRC_DIR}/ColumnReader.hh"
"${ORC_SOURCE_SRC_DIR}/ColumnWriter.cc"
+ "${ORC_SOURCE_SRC_DIR}/ColumnWriter.hh"
"${ORC_SOURCE_SRC_DIR}/Common.cc"
"${ORC_SOURCE_SRC_DIR}/Compression.cc"
+ "${ORC_SOURCE_SRC_DIR}/Compression.hh"
+ "${ORC_SOURCE_SRC_DIR}/ConvertColumnReader.cc"
+ "${ORC_SOURCE_SRC_DIR}/ConvertColumnReader.hh"
+ "${ORC_SOURCE_SRC_DIR}/CpuInfoUtil.cc"
+ "${ORC_SOURCE_SRC_DIR}/CpuInfoUtil.hh"
+ "${ORC_SOURCE_SRC_DIR}/Dispatch.hh"
+ "${ORC_SOURCE_SRC_DIR}/Exceptions.cc"
"${ORC_SOURCE_SRC_DIR}/Int128.cc"
"${ORC_SOURCE_SRC_DIR}/LzoDecompressor.cc"
+ "${ORC_SOURCE_SRC_DIR}/LzoDecompressor.hh"
"${ORC_SOURCE_SRC_DIR}/MemoryPool.cc"
+ "${ORC_SOURCE_SRC_DIR}/Murmur3.cc"
+ "${ORC_SOURCE_SRC_DIR}/Murmur3.hh"
+ "${ORC_SOURCE_SRC_DIR}/Options.hh"
+ "${ORC_SOURCE_SRC_DIR}/OrcFile.cc"
"${ORC_SOURCE_SRC_DIR}/RLE.cc"
+ "${ORC_SOURCE_SRC_DIR}/RLE.hh"
+ "${ORC_SOURCE_SRC_DIR}/RLEV2Util.cc"
+ "${ORC_SOURCE_SRC_DIR}/RLEV2Util.hh"
"${ORC_SOURCE_SRC_DIR}/RLEv1.cc"
+ "${ORC_SOURCE_SRC_DIR}/RLEv1.hh"
+ "${ORC_SOURCE_SRC_DIR}/RLEv2.hh"
+ "${ORC_SOURCE_SRC_DIR}/Reader.cc"
+ "${ORC_SOURCE_SRC_DIR}/Reader.hh"
"${ORC_SOURCE_SRC_DIR}/RleDecoderV2.cc"
"${ORC_SOURCE_SRC_DIR}/RleEncoderV2.cc"
- "${ORC_SOURCE_SRC_DIR}/RLEV2Util.cc"
+ "${ORC_SOURCE_SRC_DIR}/SchemaEvolution.cc"
+ "${ORC_SOURCE_SRC_DIR}/SchemaEvolution.hh"
"${ORC_SOURCE_SRC_DIR}/Statistics.cc"
+ "${ORC_SOURCE_SRC_DIR}/Statistics.hh"
"${ORC_SOURCE_SRC_DIR}/StripeStream.cc"
+ "${ORC_SOURCE_SRC_DIR}/StripeStream.hh"
"${ORC_SOURCE_SRC_DIR}/Timezone.cc"
+ "${ORC_SOURCE_SRC_DIR}/Timezone.hh"
"${ORC_SOURCE_SRC_DIR}/TypeImpl.cc"
+ "${ORC_SOURCE_SRC_DIR}/TypeImpl.hh"
+ "${ORC_SOURCE_SRC_DIR}/Utils.hh"
"${ORC_SOURCE_SRC_DIR}/Vector.cc"
"${ORC_SOURCE_SRC_DIR}/Writer.cc"
- "${ORC_SOURCE_SRC_DIR}/Adaptor.cc"
- "${ORC_SOURCE_SRC_DIR}/BloomFilter.cc"
- "${ORC_SOURCE_SRC_DIR}/Murmur3.cc"
- "${ORC_SOURCE_SRC_DIR}/BlockBuffer.cc"
- "${ORC_SOURCE_SRC_DIR}/wrap/orc-proto-wrapper.cc"
"${ORC_SOURCE_SRC_DIR}/io/InputStream.cc"
+ "${ORC_SOURCE_SRC_DIR}/io/InputStream.hh"
"${ORC_SOURCE_SRC_DIR}/io/OutputStream.cc"
- "${ORC_ADDITION_SOURCE_DIR}/orc_proto.pb.cc"
+ "${ORC_SOURCE_SRC_DIR}/io/OutputStream.hh"
+ "${ORC_SOURCE_SRC_DIR}/sargs/ExpressionTree.cc"
+ "${ORC_SOURCE_SRC_DIR}/sargs/ExpressionTree.hh"
+ "${ORC_SOURCE_SRC_DIR}/sargs/Literal.cc"
+ "${ORC_SOURCE_SRC_DIR}/sargs/PredicateLeaf.cc"
+ "${ORC_SOURCE_SRC_DIR}/sargs/PredicateLeaf.hh"
+ "${ORC_SOURCE_SRC_DIR}/sargs/SargsApplier.cc"
+ "${ORC_SOURCE_SRC_DIR}/sargs/SargsApplier.hh"
+ "${ORC_SOURCE_SRC_DIR}/sargs/SearchArgument.cc"
+ "${ORC_SOURCE_SRC_DIR}/sargs/SearchArgument.hh"
+ "${ORC_SOURCE_SRC_DIR}/sargs/TruthValue.cc"
)
add_library(_orc ${ORC_SRCS})
@@ -478,6 +514,10 @@ if (SANITIZE STREQUAL "undefined")
target_compile_options(_arrow PRIVATE -fno-sanitize=undefined)
endif ()
+# Define Thrift version for parquet (we use 0.16.0)
+add_definitions(-DPARQUET_THRIFT_VERSION_MAJOR=0)
+add_definitions(-DPARQUET_THRIFT_VERSION_MINOR=16)
+
# === tools
set(TOOLS_DIR "${ClickHouse_SOURCE_DIR}/contrib/arrow/cpp/tools/parquet")
diff --git a/contrib/azure-cmake/CMakeLists.txt b/contrib/azure-cmake/CMakeLists.txt
index 1e2a4c97824..7aba81259d3 100644
--- a/contrib/azure-cmake/CMakeLists.txt
+++ b/contrib/azure-cmake/CMakeLists.txt
@@ -1,6 +1,6 @@
option (ENABLE_AZURE_BLOB_STORAGE "Enable Azure blob storage" ${ENABLE_LIBRARIES})
-if (NOT ENABLE_AZURE_BLOB_STORAGE OR BUILD_STANDALONE_KEEPER OR OS_FREEBSD)
+if (NOT ENABLE_AZURE_BLOB_STORAGE OR OS_FREEBSD)
message(STATUS "Not using Azure blob storage")
return()
endif()
diff --git a/contrib/capnproto b/contrib/capnproto
index dc8b50b9997..976209a6d18 160000
--- a/contrib/capnproto
+++ b/contrib/capnproto
@@ -1 +1 @@
-Subproject commit dc8b50b999777bcb23c89bb5907c785c3f654441
+Subproject commit 976209a6d18074804f60d18ef99b6a809d27dadf
diff --git a/contrib/cityhash102/include/city.h b/contrib/cityhash102/include/city.h
index 77d4c988cdd..87363d16444 100644
--- a/contrib/cityhash102/include/city.h
+++ b/contrib/cityhash102/include/city.h
@@ -61,11 +61,24 @@ namespace CityHash_v1_0_2
typedef uint8_t uint8;
typedef uint32_t uint32;
typedef uint64_t uint64;
-typedef std::pair<uint64, uint64> uint128;
+/// Represent an unsigned integer of 128 bits as it's used in CityHash.
+/// Originally CityHash used `std::pair` instead of this struct,
+/// however the members `first` and `second` could be easily confused so they were renamed to `low64` and `high64`:
+/// `first` -> `low64`, `second` -> `high64`.
+struct uint128
+{
+ uint64 low64 = 0;
+ uint64 high64 = 0;
-inline uint64 Uint128Low64(const uint128& x) { return x.first; }
-inline uint64 Uint128High64(const uint128& x) { return x.second; }
+ uint128() = default;
+ uint128(uint64 low64_, uint64 high64_) : low64(low64_), high64(high64_) {}
+ friend bool operator ==(const uint128 & x, const uint128 & y) { return (x.low64 == y.low64) && (x.high64 == y.high64); }
+ friend bool operator !=(const uint128 & x, const uint128 & y) { return !(x == y); }
+};
+
+inline uint64 Uint128Low64(const uint128 & x) { return x.low64; }
+inline uint64 Uint128High64(const uint128 & x) { return x.high64; }
// Hash function for a byte array.
uint64 CityHash64(const char *buf, size_t len);
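
A small sketch of what the rename buys at call sites (a hypothetical helper, assuming city.h is on the include path):

```cpp
#include "city.h"

// With std::pair this read as h.first ^ h.second, which was easy to get
// backwards; the named fields state intent.
CityHash_v1_0_2::uint64 fold(const CityHash_v1_0_2::uint128 & h)
{
    return h.low64 ^ h.high64;
}
```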
diff --git a/contrib/jemalloc-cmake/CMakeLists.txt b/contrib/jemalloc-cmake/CMakeLists.txt
index d5ea69d4926..97f723bb540 100644
--- a/contrib/jemalloc-cmake/CMakeLists.txt
+++ b/contrib/jemalloc-cmake/CMakeLists.txt
@@ -4,7 +4,7 @@ if (SANITIZE OR NOT (
))
if (ENABLE_JEMALLOC)
message (${RECONFIGURE_MESSAGE_LEVEL}
- "jemalloc is disabled implicitly: it doesn't work with sanitizers and can only be used with x86_64, aarch64, or ppc64le Linux or FreeBSD builds and RelWithDebInfo macOS builds.")
+ "jemalloc is disabled implicitly: it doesn't work with sanitizers and can only be used with x86_64, aarch64, or ppc64le Linux or FreeBSD builds and RelWithDebInfo macOS builds. Use -DENABLE_JEMALLOC=0")
endif ()
set (ENABLE_JEMALLOC OFF)
else ()
diff --git a/contrib/libhdfs3 b/contrib/libhdfs3
index 164b89253fa..377220ef351 160000
--- a/contrib/libhdfs3
+++ b/contrib/libhdfs3
@@ -1 +1 @@
-Subproject commit 164b89253fad7991bce77882f01b51ab81d19f3d
+Subproject commit 377220ef351ae24994a5fcd2b5fa3930d00c4db0
diff --git a/contrib/libhdfs3-cmake/CMakeLists.txt b/contrib/libhdfs3-cmake/CMakeLists.txt
index e2f122e282a..a630a8e45c4 100644
--- a/contrib/libhdfs3-cmake/CMakeLists.txt
+++ b/contrib/libhdfs3-cmake/CMakeLists.txt
@@ -1,11 +1,11 @@
-if(NOT ARCH_AARCH64 AND NOT OS_FREEBSD AND NOT APPLE AND NOT ARCH_PPC64LE AND NOT ARCH_S390X)
+if(NOT OS_FREEBSD AND NOT APPLE AND NOT ARCH_PPC64LE AND NOT ARCH_S390X)
option(ENABLE_HDFS "Enable HDFS" ${ENABLE_LIBRARIES})
elseif(ENABLE_HDFS)
message (${RECONFIGURE_MESSAGE_LEVEL} "Cannot use HDFS3 with current configuration")
endif()
if(NOT ENABLE_HDFS)
- message(STATUS "Not using hdfs")
+ message(STATUS "Not using HDFS")
return()
endif()
diff --git a/contrib/lz4 b/contrib/lz4
index 4c9431e9af5..e82198428c8 160000
--- a/contrib/lz4
+++ b/contrib/lz4
@@ -1 +1 @@
-Subproject commit 4c9431e9af596af0556e5da0ae99305bafb2b10b
+Subproject commit e82198428c8061372d5adef1f9bfff4203f6081e
diff --git a/contrib/lz4-cmake/CMakeLists.txt b/contrib/lz4-cmake/CMakeLists.txt
index 94def029410..c0fd574134f 100644
--- a/contrib/lz4-cmake/CMakeLists.txt
+++ b/contrib/lz4-cmake/CMakeLists.txt
@@ -12,6 +12,7 @@ add_library (_lz4 ${SRCS})
add_library (ch_contrib::lz4 ALIAS _lz4)
target_compile_definitions (_lz4 PUBLIC LZ4_DISABLE_DEPRECATE_WARNINGS=1)
+target_compile_definitions (_lz4 PUBLIC LZ4_FAST_DEC_LOOP=1)
if (SANITIZE STREQUAL "undefined")
target_compile_options (_lz4 PRIVATE -fno-sanitize=undefined)
endif ()
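
LZ4_FAST_DEC_LOOP=1 enables the optimized decompression loop inside the library; calling code is unchanged. A minimal round-trip for reference, assuming liblz4 headers and library are available:

```cpp
#include <lz4.h>
#include <string>
#include <vector>

// Compress and decompress a buffer; the fast decode loop affects only the
// internals of LZ4_decompress_safe, not its API.
std::string roundTrip(const std::string & src)
{
    std::vector<char> compressed(LZ4_compressBound(static_cast<int>(src.size())));
    int csize = LZ4_compress_default(
        src.data(), compressed.data(),
        static_cast<int>(src.size()), static_cast<int>(compressed.size()));
    std::string out(src.size(), '\0');
    LZ4_decompress_safe(compressed.data(), out.data(), csize, static_cast<int>(out.size()));
    return out;
}
```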
diff --git a/contrib/orc b/contrib/orc
index c5d7755ba0b..568d1d60c25 160000
--- a/contrib/orc
+++ b/contrib/orc
@@ -1 +1 @@
-Subproject commit c5d7755ba0b9a95631c8daea4d094101f26ec761
+Subproject commit 568d1d60c250af1890f226c182bc15bd8cc94cf1
diff --git a/contrib/re2 b/contrib/re2
index 13ebb377c6a..03da4fc0857 160000
--- a/contrib/re2
+++ b/contrib/re2
@@ -1 +1 @@
-Subproject commit 13ebb377c6ad763ca61d12dd6f88b1126bd0b911
+Subproject commit 03da4fc0857c285e3a26782f6bc8931c4c950df4
diff --git a/contrib/re2-cmake/CMakeLists.txt b/contrib/re2-cmake/CMakeLists.txt
index 19939c11ebf..305c2400c77 100644
--- a/contrib/re2-cmake/CMakeLists.txt
+++ b/contrib/re2-cmake/CMakeLists.txt
@@ -12,6 +12,7 @@ endif()
set(SRC_DIR "${ClickHouse_SOURCE_DIR}/contrib/re2")
set(RE2_SOURCES
+ ${SRC_DIR}/re2/bitmap256.cc
${SRC_DIR}/re2/bitstate.cc
${SRC_DIR}/re2/compile.cc
${SRC_DIR}/re2/dfa.cc
@@ -28,15 +29,16 @@ set(RE2_SOURCES
${SRC_DIR}/re2/regexp.cc
${SRC_DIR}/re2/set.cc
${SRC_DIR}/re2/simplify.cc
- ${SRC_DIR}/re2/stringpiece.cc
${SRC_DIR}/re2/tostring.cc
${SRC_DIR}/re2/unicode_casefold.cc
${SRC_DIR}/re2/unicode_groups.cc
+ ${SRC_DIR}/util/pcre.cc
${SRC_DIR}/util/rune.cc
${SRC_DIR}/util/strutil.cc
)
add_library(re2 ${RE2_SOURCES})
target_include_directories(re2 PUBLIC "${SRC_DIR}")
+target_link_libraries(re2 ch_contrib::abseil_str_format)
# Building re2 which is thread-safe and re2_st which is not.
# re2 changes its state during matching of regular expression, e.g. creates temporary DFA.
@@ -48,6 +50,7 @@ target_compile_definitions (re2_st PRIVATE NDEBUG NO_THREADS re2=re2_st)
target_include_directories (re2_st PRIVATE .)
target_include_directories (re2_st SYSTEM PUBLIC ${CMAKE_CURRENT_BINARY_DIR})
target_include_directories (re2_st SYSTEM BEFORE PUBLIC ${SRC_DIR})
+target_link_libraries (re2_st ch_contrib::abseil_str_format)
file (MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/re2_st)
foreach (FILENAME filtered_re2.h re2.h set.h stringpiece.h)
@@ -60,17 +63,6 @@ foreach (FILENAME filtered_re2.h re2.h set.h stringpiece.h)
add_dependencies (re2_st transform_${FILENAME})
endforeach ()
-file (MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/util)
-foreach (FILENAME mutex.h)
- add_custom_command (OUTPUT "${CMAKE_CURRENT_BINARY_DIR}/util/${FILENAME}"
- COMMAND ${CMAKE_COMMAND} -DSOURCE_FILENAME="${SRC_DIR}/util/${FILENAME}"
- -DTARGET_FILENAME="${CMAKE_CURRENT_BINARY_DIR}/util/${FILENAME}"
- -P "${CMAKE_CURRENT_SOURCE_DIR}/re2_transform.cmake"
- COMMENT "Creating ${FILENAME} for re2_st library.")
- add_custom_target (transform_${FILENAME} DEPENDS "${CMAKE_CURRENT_BINARY_DIR}/util/${FILENAME}")
- add_dependencies (re2_st transform_${FILENAME})
-endforeach ()
-
# NOTE: you should not change name of library here, since it is used to generate required header (see above)
add_library(ch_contrib::re2 ALIAS re2)
add_library(ch_contrib::re2_st ALIAS re2_st)
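
The new link dependency reflects that the updated re2 uses Abseil's type-safe formatting internally. A minimal illustration of the API the `_abseil_str_format` target provides (an assumed standalone usage, not re2 code):

```cpp
#include <string>
#include "absl/strings/str_format.h"

// absl::StrFormat is a type-checked printf-style formatter returning
// std::string; mismatched arguments fail at compile time.
std::string describe(int id, double score)
{
    return absl::StrFormat("id=%d score=%.2f", id, score);
}
```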
diff --git a/docker/images.json b/docker/images.json
index b4f3e755bd1..e8fc329a640 100644
--- a/docker/images.json
+++ b/docker/images.json
@@ -120,11 +120,12 @@
"docker/test/base": {
"name": "clickhouse/test-base",
"dependent": [
- "docker/test/stateless",
- "docker/test/integration/base",
"docker/test/fuzzer",
+ "docker/test/integration/base",
"docker/test/keeper-jepsen",
- "docker/test/server-jepsen"
+ "docker/test/server-jepsen",
+ "docker/test/sqllogic",
+ "docker/test/stateless"
]
},
"docker/test/integration/kerberized_hadoop": {
diff --git a/docker/keeper/Dockerfile b/docker/keeper/Dockerfile
index 73da4515ff4..f13fcdc14d6 100644
--- a/docker/keeper/Dockerfile
+++ b/docker/keeper/Dockerfile
@@ -32,7 +32,7 @@ RUN arch=${TARGETARCH:-amd64} \
esac
ARG REPOSITORY="https://s3.amazonaws.com/clickhouse-builds/22.4/31c367d3cd3aefd316778601ff6565119fe36682/package_release"
-ARG VERSION="23.4.2.11"
+ARG VERSION="23.6.1.1524"
ARG PACKAGES="clickhouse-keeper"
# user/group precreated explicitly with fixed uid/gid on purpose.
diff --git a/docker/packager/binary/Dockerfile b/docker/packager/binary/Dockerfile
index fa860b2207f..e824161a688 100644
--- a/docker/packager/binary/Dockerfile
+++ b/docker/packager/binary/Dockerfile
@@ -46,10 +46,12 @@ ENV CXX=clang++-${LLVM_VERSION}
# Rust toolchain and libraries
ENV RUSTUP_HOME=/rust/rustup
ENV CARGO_HOME=/rust/cargo
-ENV PATH="/rust/cargo/env:${PATH}"
ENV PATH="/rust/cargo/bin:${PATH}"
RUN curl https://sh.rustup.rs -sSf | bash -s -- -y && \
chmod 777 -R /rust && \
+ rustup toolchain install nightly && \
+ rustup default nightly && \
+ rustup component add rust-src && \
rustup target add aarch64-unknown-linux-gnu && \
rustup target add x86_64-apple-darwin && \
rustup target add x86_64-unknown-freebsd && \
@@ -87,7 +89,7 @@ RUN arch=${TARGETARCH:-amd64} \
&& dpkg -i /tmp/nfpm.deb \
&& rm /tmp/nfpm.deb
-ARG GO_VERSION=1.19.5
+ARG GO_VERSION=1.19.10
# We need go for clickhouse-diagnostics
RUN arch=${TARGETARCH:-amd64} \
&& curl -Lo /tmp/go.tgz "https://go.dev/dl/go${GO_VERSION}.linux-${arch}.tar.gz" \
diff --git a/docker/packager/binary/build.sh b/docker/packager/binary/build.sh
index 2cd0a011013..c0803c74147 100755
--- a/docker/packager/binary/build.sh
+++ b/docker/packager/binary/build.sh
@@ -11,9 +11,11 @@ ccache_status () {
[ -O /build ] || git config --global --add safe.directory /build
-mkdir -p /build/cmake/toolchain/darwin-x86_64
-tar xJf /MacOSX11.0.sdk.tar.xz -C /build/cmake/toolchain/darwin-x86_64 --strip-components=1
-ln -sf darwin-x86_64 /build/cmake/toolchain/darwin-aarch64
+if [ "$EXTRACT_TOOLCHAIN_DARWIN" = "1" ]; then
+ mkdir -p /build/cmake/toolchain/darwin-x86_64
+ tar xJf /MacOSX11.0.sdk.tar.xz -C /build/cmake/toolchain/darwin-x86_64 --strip-components=1
+ ln -sf darwin-x86_64 /build/cmake/toolchain/darwin-aarch64
+fi
# Uncomment to debug ccache. Don't put ccache log in /output right away, or it
# will be confusingly packed into the "performance" package.
diff --git a/docker/packager/packager b/docker/packager/packager
index a894fe2d8e9..1b3df858cd2 100755
--- a/docker/packager/packager
+++ b/docker/packager/packager
@@ -167,6 +167,7 @@ def parse_env_variables(
cmake_flags.append(
"-DCMAKE_TOOLCHAIN_FILE=/build/cmake/darwin/toolchain-x86_64.cmake"
)
+ result.append("EXTRACT_TOOLCHAIN_DARWIN=1")
elif is_cross_darwin_arm:
cc = compiler[: -len(DARWIN_ARM_SUFFIX)]
cmake_flags.append("-DCMAKE_AR:FILEPATH=/cctools/bin/aarch64-apple-darwin-ar")
@@ -181,6 +182,7 @@ def parse_env_variables(
cmake_flags.append(
"-DCMAKE_TOOLCHAIN_FILE=/build/cmake/darwin/toolchain-aarch64.cmake"
)
+ result.append("EXTRACT_TOOLCHAIN_DARWIN=1")
elif is_cross_arm:
cc = compiler[: -len(ARM_SUFFIX)]
cmake_flags.append(
diff --git a/docker/server/Dockerfile.alpine b/docker/server/Dockerfile.alpine
index 1a5d2071f6b..5e5be3f6d73 100644
--- a/docker/server/Dockerfile.alpine
+++ b/docker/server/Dockerfile.alpine
@@ -33,7 +33,7 @@ RUN arch=${TARGETARCH:-amd64} \
# lts / testing / prestable / etc
ARG REPO_CHANNEL="stable"
ARG REPOSITORY="https://packages.clickhouse.com/tgz/${REPO_CHANNEL}"
-ARG VERSION="23.4.2.11"
+ARG VERSION="23.6.1.1524"
ARG PACKAGES="clickhouse-client clickhouse-server clickhouse-common-static"
# user/group precreated explicitly with fixed uid/gid on purpose.
diff --git a/docker/server/Dockerfile.ubuntu b/docker/server/Dockerfile.ubuntu
index 8792d419a16..8693193455f 100644
--- a/docker/server/Dockerfile.ubuntu
+++ b/docker/server/Dockerfile.ubuntu
@@ -1,4 +1,4 @@
-FROM ubuntu:22.04
+FROM ubuntu:20.04
# see https://github.com/moby/moby/issues/4032#issuecomment-192327844
ARG DEBIAN_FRONTEND=noninteractive
@@ -11,18 +11,19 @@ RUN sed -i "s|http://archive.ubuntu.com|${apt_archive}|g" /etc/apt/sources.list
&& apt-get update \
&& apt-get upgrade -yq \
&& apt-get install --yes --no-install-recommends \
- apt-transport-https \
ca-certificates \
- dirmngr \
- gnupg2 \
- wget \
locales \
tzdata \
- && apt-get clean
+ wget \
+ && apt-get clean \
+ && rm -rf \
+ /var/lib/apt/lists/* \
+ /var/cache/debconf \
+ /tmp/*
ARG REPO_CHANNEL="stable"
-ARG REPOSITORY="deb https://packages.clickhouse.com/deb ${REPO_CHANNEL} main"
-ARG VERSION="23.4.2.11"
+ARG REPOSITORY="deb [signed-by=/usr/share/keyrings/clickhouse-keyring.gpg] https://packages.clickhouse.com/deb ${REPO_CHANNEL} main"
+ARG VERSION="23.6.1.1524"
ARG PACKAGES="clickhouse-client clickhouse-server clickhouse-common-static"
# set non-empty deb_location_url url to create a docker image
@@ -43,49 +44,68 @@ ARG single_binary_location_url=""
ARG TARGETARCH
-RUN arch=${TARGETARCH:-amd64} \
+# install from a web location with deb packages
+RUN arch="${TARGETARCH:-amd64}" \
&& if [ -n "${deb_location_url}" ]; then \
echo "installing from custom url with deb packages: ${deb_location_url}" \
- rm -rf /tmp/clickhouse_debs \
+ && rm -rf /tmp/clickhouse_debs \
&& mkdir -p /tmp/clickhouse_debs \
&& for package in ${PACKAGES}; do \
{ wget --progress=bar:force:noscroll "${deb_location_url}/${package}_${VERSION}_${arch}.deb" -P /tmp/clickhouse_debs || \
wget --progress=bar:force:noscroll "${deb_location_url}/${package}_${VERSION}_all.deb" -P /tmp/clickhouse_debs ; } \
|| exit 1 \
; done \
- && dpkg -i /tmp/clickhouse_debs/*.deb ; \
- elif [ -n "${single_binary_location_url}" ]; then \
+ && dpkg -i /tmp/clickhouse_debs/*.deb \
+ && rm -rf /tmp/* ; \
+ fi
+
+# install from a single binary
+RUN if [ -n "${single_binary_location_url}" ]; then \
echo "installing from single binary url: ${single_binary_location_url}" \
&& rm -rf /tmp/clickhouse_binary \
&& mkdir -p /tmp/clickhouse_binary \
&& wget --progress=bar:force:noscroll "${single_binary_location_url}" -O /tmp/clickhouse_binary/clickhouse \
&& chmod +x /tmp/clickhouse_binary/clickhouse \
- && /tmp/clickhouse_binary/clickhouse install --user "clickhouse" --group "clickhouse" ; \
- else \
- mkdir -p /etc/apt/sources.list.d \
- && apt-key adv --keyserver keyserver.ubuntu.com --recv 8919F6BD2B48D754 \
- && echo ${REPOSITORY} > /etc/apt/sources.list.d/clickhouse.list \
+ && /tmp/clickhouse_binary/clickhouse install --user "clickhouse" --group "clickhouse" \
+ && rm -rf /tmp/* ; \
+ fi
+
+# A fallback to installation from ClickHouse repository
+RUN if ! clickhouse local -q "SELECT ''" > /dev/null 2>&1; then \
+ apt-get update \
+ && apt-get install --yes --no-install-recommends \
+ apt-transport-https \
+ ca-certificates \
+ dirmngr \
+ gnupg2 \
+ && mkdir -p /etc/apt/sources.list.d \
+ && GNUPGHOME=$(mktemp -d) \
+ && GNUPGHOME="$GNUPGHOME" gpg --no-default-keyring \
+ --keyring /usr/share/keyrings/clickhouse-keyring.gpg \
+ --keyserver hkp://keyserver.ubuntu.com:80 --recv-keys 8919F6BD2B48D754 \
+ && rm -r "$GNUPGHOME" \
+ && chmod +r /usr/share/keyrings/clickhouse-keyring.gpg \
+ && echo "${REPOSITORY}" > /etc/apt/sources.list.d/clickhouse.list \
&& echo "installing from repository: ${REPOSITORY}" \
&& apt-get update \
- && apt-get --yes -o "Dpkg::Options::=--force-confdef" -o "Dpkg::Options::=--force-confold" upgrade \
&& for package in ${PACKAGES}; do \
packages="${packages} ${package}=${VERSION}" \
; done \
&& apt-get install --allow-unauthenticated --yes --no-install-recommends ${packages} || exit 1 \
- ; fi \
- && clickhouse-local -q 'SELECT * FROM system.build_options' \
- && rm -rf \
- /var/lib/apt/lists/* \
- /var/cache/debconf \
- /tmp/* \
- && mkdir -p /var/lib/clickhouse /var/log/clickhouse-server /etc/clickhouse-server /etc/clickhouse-client \
- && chmod ugo+Xrw -R /var/lib/clickhouse /var/log/clickhouse-server /etc/clickhouse-server /etc/clickhouse-client
-
-RUN apt-get autoremove --purge -yq libksba8 && \
- apt-get autoremove -yq
+ && rm -rf \
+ /var/lib/apt/lists/* \
+ /var/cache/debconf \
+ /tmp/* \
+ && apt-get autoremove --purge -yq libksba8 \
+ && apt-get autoremove -yq \
+ ; fi
+# post install
# we need to allow "others" access to clickhouse folder, because docker container
# can be started with arbitrary uid (openshift usecase)
+RUN clickhouse-local -q 'SELECT * FROM system.build_options' \
+ && mkdir -p /var/lib/clickhouse /var/log/clickhouse-server /etc/clickhouse-server /etc/clickhouse-client \
+ && chmod ugo+Xrw -R /var/lib/clickhouse /var/log/clickhouse-server /etc/clickhouse-server /etc/clickhouse-client
RUN locale-gen en_US.UTF-8
ENV LANG en_US.UTF-8
diff --git a/docker/server/README.md b/docker/server/README.md
index e6c9ee51fa7..67646a262f5 100644
--- a/docker/server/README.md
+++ b/docker/server/README.md
@@ -16,6 +16,11 @@ For more information and documentation see https://clickhouse.com/.
- The tag `head` is built from the latest commit to the default branch.
- Each tag has optional `-alpine` suffix to reflect that it's built on top of `alpine`.
+### Compatibility
+
+- The amd64 image requires support for [SSE3 instructions](https://en.wikipedia.org/wiki/SSE3). Virtually all x86 CPUs after 2005 support SSE3.
+- The arm64 image requires support for the [ARMv8.2-A architecture](https://en.wikipedia.org/wiki/AArch64#ARMv8.2-A). Most ARM CPUs after 2017 support ARMv8.2-A. A notable exception is Raspberry Pi 4 from 2019 whose CPU only supports ARMv8.0-A.
+
## How to use this image
### start server instance
diff --git a/docker/test/fasttest/Dockerfile b/docker/test/fasttest/Dockerfile
index ffb13fc774d..da4baa8c687 100644
--- a/docker/test/fasttest/Dockerfile
+++ b/docker/test/fasttest/Dockerfile
@@ -9,6 +9,7 @@ RUN apt-get update \
expect \
file \
lsof \
+ odbcinst \
psmisc \
python3 \
python3-lxml \
diff --git a/docker/test/fasttest/run.sh b/docker/test/fasttest/run.sh
index dab873377ce..989ed9d2fbb 100755
--- a/docker/test/fasttest/run.sh
+++ b/docker/test/fasttest/run.sh
@@ -80,7 +80,7 @@ function start_server
function clone_root
{
- git config --global --add safe.directory "$FASTTEST_SOURCE"
+ [ "$UID" -eq 0 ] && git config --global --add safe.directory "$FASTTEST_SOURCE"
git clone --depth 1 https://github.com/ClickHouse/ClickHouse.git -- "$FASTTEST_SOURCE" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee "$FASTTEST_OUTPUT/clone_log.txt"
(
@@ -151,7 +151,7 @@ function clone_submodules
)
git submodule sync
- git submodule update --jobs=16 --depth 1 --init "${SUBMODULES_TO_UPDATE[@]}"
+ git submodule update --jobs=16 --depth 1 --single-branch --init "${SUBMODULES_TO_UPDATE[@]}"
git submodule foreach git reset --hard
git submodule foreach git checkout @ -f
git submodule foreach git clean -xfd
@@ -202,10 +202,11 @@ function build
| ts '%Y-%m-%d %H:%M:%S' \
| tee "$FASTTEST_OUTPUT/test_result.txt"
if [ "$COPY_CLICKHOUSE_BINARY_TO_OUTPUT" -eq "1" ]; then
- cp programs/clickhouse "$FASTTEST_OUTPUT/clickhouse"
+ mkdir -p "$FASTTEST_OUTPUT/binaries/"
+ cp programs/clickhouse "$FASTTEST_OUTPUT/binaries/clickhouse"
- strip programs/clickhouse -o "$FASTTEST_OUTPUT/clickhouse-stripped"
- zstd --threads=0 "$FASTTEST_OUTPUT/clickhouse-stripped"
+ strip programs/clickhouse -o programs/clickhouse-stripped
+ zstd --threads=0 programs/clickhouse-stripped -o "$FASTTEST_OUTPUT/binaries/clickhouse-stripped.zst"
fi
ccache_status
ccache --evict-older-than 1d ||:
diff --git a/docker/test/integration/base/Dockerfile b/docker/test/integration/base/Dockerfile
index de8efa20af4..270b40e23a6 100644
--- a/docker/test/integration/base/Dockerfile
+++ b/docker/test/integration/base/Dockerfile
@@ -46,12 +46,13 @@ RUN arch=${TARGETARCH:-amd64} \
arm64) rarch=aarch64 ;; \
esac \
&& cd /tmp \
- && curl -o mysql-odbc.rpm "https://cdn.mysql.com/archives/mysql-connector-odbc-8.0/mysql-connector-odbc-8.0.27-1.el8.${rarch}.rpm" \
+ && curl -o mysql-odbc.rpm "https://cdn.mysql.com/archives/mysql-connector-odbc-8.0/mysql-connector-odbc-8.0.32-1.el9.${rarch}.rpm" \
&& rpm2archive mysql-odbc.rpm \
&& tar xf mysql-odbc.rpm.tgz -C / ./usr/lib64/ \
- && LINK_DIR=$(dpkg -L libodbc1 | rg '^/usr/lib/.*-linux-gnu/odbc$') \
- && ln -s /usr/lib64/libmyodbc8a.so "$LINK_DIR" \
- && ln -s /usr/lib64/libmyodbc8a.so "$LINK_DIR"/libmyodbc.so
+ && rm mysql-odbc.rpm mysql-odbc.rpm.tgz \
+ && ODBC_DIR=$(dpkg -L odbc-postgresql | rg '^/usr/lib/.*-linux-gnu/odbc$') \
+ && ln -s /usr/lib64/libmyodbc8a.so "$ODBC_DIR" \
+ && ln -s /usr/lib64/libmyodbc8a.so "$ODBC_DIR"/libmyodbc.so
# Unfortunately this is required for a single test for conversion data from zookeeper to clickhouse-keeper.
# ZooKeeper is not started by default, but consumes some space in containers.
diff --git a/docker/test/integration/helper_container/Dockerfile b/docker/test/integration/helper_container/Dockerfile
index 6a093081bf2..60adaea1796 100644
--- a/docker/test/integration/helper_container/Dockerfile
+++ b/docker/test/integration/helper_container/Dockerfile
@@ -2,4 +2,7 @@
# Helper docker container to run iptables without sudo
FROM alpine
-RUN apk add -U iproute2
+RUN apk add --no-cache -U iproute2 \
+ && for bin in iptables iptables-restore iptables-save; \
+ do ln -sf xtables-nft-multi "/sbin/$bin"; \
+ done
diff --git a/docker/test/integration/mysql_php_client/Dockerfile b/docker/test/integration/mysql_php_client/Dockerfile
index 55db4d15a7f..0e11ae023e6 100644
--- a/docker/test/integration/mysql_php_client/Dockerfile
+++ b/docker/test/integration/mysql_php_client/Dockerfile
@@ -1,7 +1,7 @@
# docker build -t clickhouse/mysql-php-client .
# MySQL PHP client docker container
-FROM php:8.0.18-cli
+FROM php:8-cli-alpine
COPY ./client.crt client.crt
COPY ./client.key client.key
diff --git a/docker/test/integration/runner/Dockerfile b/docker/test/integration/runner/Dockerfile
index 14c97e479f6..38d8ed5f223 100644
--- a/docker/test/integration/runner/Dockerfile
+++ b/docker/test/integration/runner/Dockerfile
@@ -1,5 +1,5 @@
# docker build -t clickhouse/integration-tests-runner .
-FROM ubuntu:20.04
+FROM ubuntu:22.04
# ARG for quick switch to a given ubuntu mirror
ARG apt_archive="http://archive.ubuntu.com"
@@ -56,17 +56,19 @@ RUN curl -fsSL https://download.docker.com/linux/ubuntu/gpg | apt-key add - \
/var/lib/apt/lists/* \
/var/cache/debconf \
/tmp/* \
- && apt-get clean
+ && apt-get clean \
+ && dockerd --version; docker --version
-RUN dockerd --version; docker --version
RUN python3 -m pip install --no-cache-dir \
PyMySQL \
- aerospike==4.0.0 \
- avro==1.10.2 \
+ aerospike==11.1.0 \
asyncio \
+ avro==1.10.2 \
+ azure-storage-blob \
cassandra-driver \
- confluent-kafka==1.5.0 \
+ confluent-kafka==1.9.2 \
+ delta-spark==2.3.0 \
dict2xml \
dicttoxml \
docker \
@@ -76,47 +78,51 @@ RUN python3 -m pip install --no-cache-dir \
kafka-python \
kazoo \
lz4 \
+ meilisearch==0.18.3 \
minio \
nats-py \
protobuf \
- psycopg2-binary==2.8.6 \
+ psycopg2-binary==2.9.6 \
+ pyhdfs \
pymongo==3.11.0 \
+ pyspark==3.3.2 \
pytest \
pytest-order==1.0.0 \
- pytest-timeout \
pytest-random \
- pytest-xdist \
pytest-repeat \
+ pytest-timeout \
+ pytest-xdist \
pytz \
redis \
- tzlocal==2.1 \
- urllib3 \
requests-kerberos \
- pyspark==3.3.2 \
- delta-spark==2.2.0 \
- pyhdfs \
- azure-storage-blob \
- meilisearch==0.18.3
-
-COPY modprobe.sh /usr/local/bin/modprobe
-COPY dockerd-entrypoint.sh /usr/local/bin/
-COPY compose/ /compose/
-COPY misc/ /misc/
+ tzlocal==2.1 \
+ urllib3
+# Hudi supports only spark 3.3.*, not 3.4
RUN curl -fsSL -O https://dlcdn.apache.org/spark/spark-3.3.2/spark-3.3.2-bin-hadoop3.tgz \
&& tar xzvf spark-3.3.2-bin-hadoop3.tgz -C / \
&& rm spark-3.3.2-bin-hadoop3.tgz
# download spark and packages
# if you change packages, don't forget to update them in tests/integration/helpers/cluster.py
-RUN echo ":quit" | /spark-3.3.2-bin-hadoop3/bin/spark-shell --packages "org.apache.hudi:hudi-spark3.3-bundle_2.12:0.13.0,io.delta:delta-core_2.12:2.2.0,org.apache.iceberg:iceberg-spark-runtime-3.3_2.12:1.1.0" > /dev/null
+RUN packages="org.apache.hudi:hudi-spark3.3-bundle_2.12:0.13.0,\
+io.delta:delta-core_2.12:2.3.0,\
+org.apache.iceberg:iceberg-spark-runtime-3.3_2.12:1.1.0" \
+ && /spark-3.3.2-bin-hadoop3/bin/spark-shell --packages "$packages" > /dev/null \
+ && find /root/.ivy2/ -name '*.jar' -exec ln -sf {} /spark-3.3.2-bin-hadoop3/jars/ \;
RUN set -x \
&& addgroup --system dockremap \
- && adduser --system dockremap \
+ && adduser --system dockremap \
&& adduser dockremap dockremap \
&& echo 'dockremap:165536:65536' >> /etc/subuid \
- && echo 'dockremap:165536:65536' >> /etc/subgid
+ && echo 'dockremap:165536:65536' >> /etc/subgid
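+# (dockremap is the conventional user for dockerd's userns-remap: container
+# root, uid 0, maps to host uid 165536, with a range of 65536 subordinate ids;
+# /etc/subuid and /etc/subgid must agree for dockerd to start.)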
+
+COPY modprobe.sh /usr/local/bin/modprobe
+COPY dockerd-entrypoint.sh /usr/local/bin/
+COPY compose/ /compose/
+COPY misc/ /misc/
+
# Same options as in test/base/Dockerfile
# (in case you need to override them in tests)
diff --git a/docker/test/integration/runner/dockerd-entrypoint.sh b/docker/test/integration/runner/dockerd-entrypoint.sh
index fe47fc90951..3c4ff522b36 100755
--- a/docker/test/integration/runner/dockerd-entrypoint.sh
+++ b/docker/test/integration/runner/dockerd-entrypoint.sh
@@ -12,6 +12,17 @@ echo '{
"registry-mirrors" : ["http://dockerhub-proxy.dockerhub-proxy-zone:5000"]
}' | dd of=/etc/docker/daemon.json 2>/dev/null
+if [ -f /sys/fs/cgroup/cgroup.controllers ]; then
+ # move the processes from the root group to the /init group,
+ # otherwise writing subtree_control fails with EBUSY.
+ # An error from moving a non-existent process (e.g. "cat") is ignored.
+ mkdir -p /sys/fs/cgroup/init
+ xargs -rn1 < /sys/fs/cgroup/cgroup.procs > /sys/fs/cgroup/init/cgroup.procs || :
+ # enable controllers
+ sed -e 's/ / +/g' -e 's/^/+/' < /sys/fs/cgroup/cgroup.controllers \
+ > /sys/fs/cgroup/cgroup.subtree_control
+fi
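+# e.g. if cgroup.controllers reads "cpuset cpu io memory pids", the sed above
+# writes "+cpuset +cpu +io +memory +pids" into cgroup.subtree_control,
+# delegating those controllers to child cgroups.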
+
# In case a test hangs, it is convenient to use pytest --pdb to debug it,
# and on a hang you can simply press Ctrl-C to spawn a Python pdb,
# but on SIGINT dockerd will exit, so ignore it to preserve the daemon.
@@ -52,6 +63,8 @@ export CLICKHOUSE_TESTS_BASE_CONFIG_DIR=/clickhouse-config
export CLICKHOUSE_ODBC_BRIDGE_BINARY_PATH=/clickhouse-odbc-bridge
export CLICKHOUSE_LIBRARY_BRIDGE_BINARY_PATH=/clickhouse-library-bridge
+export DOCKER_BASE_TAG=${DOCKER_BASE_TAG:=latest}
+export DOCKER_HELPER_TAG=${DOCKER_HELPER_TAG:=latest}
export DOCKER_MYSQL_GOLANG_CLIENT_TAG=${DOCKER_MYSQL_GOLANG_CLIENT_TAG:=latest}
export DOCKER_DOTNET_CLIENT_TAG=${DOCKER_DOTNET_CLIENT_TAG:=latest}
export DOCKER_MYSQL_JAVA_CLIENT_TAG=${DOCKER_MYSQL_JAVA_CLIENT_TAG:=latest}
diff --git a/docker/test/performance-comparison/compare.sh b/docker/test/performance-comparison/compare.sh
index 293ad9ac411..798d2a40b12 100755
--- a/docker/test/performance-comparison/compare.sh
+++ b/docker/test/performance-comparison/compare.sh
@@ -14,6 +14,13 @@ LEFT_SERVER_PORT=9001
# patched version
RIGHT_SERVER_PORT=9002
+# abort_conf -- abort if some option is not recognized
+# abort -- abort if something is not right in the env (e.g. per-cpu arenas do not work)
+# narenas -- set the number of arenas explicitly, to keep per-cpu arenas from
+#            being disabled in an environment where _SC_NPROCESSORS_ONLN,
+#            _SC_NPROCESSORS_CONF and sched_getaffinity return different
+#            numbers of CPUs
+export MALLOC_CONF="abort_conf:true,abort:true,narenas:$(nproc --all)"
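+# e.g. on a 16-CPU runner the export above expands to
+# MALLOC_CONF="abort_conf:true,abort:true,narenas:16"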
+
function wait_for_server # port, pid
{
for _ in {1..60}
@@ -109,10 +116,6 @@ function restart
while pkill -f clickhouse-serv ; do echo . ; sleep 1 ; done
echo all killed
- # Change the jemalloc settings here.
- # https://github.com/jemalloc/jemalloc/wiki/Getting-Started
- export MALLOC_CONF="confirm_conf:true"
-
set -m # Spawn servers in their own process groups
local left_server_opts=(
@@ -147,8 +150,6 @@ function restart
set +m
- unset MALLOC_CONF
-
wait_for_server $LEFT_SERVER_PORT $left_pid
echo left ok
diff --git a/docker/test/performance-comparison/report.py b/docker/test/performance-comparison/report.py
index 214f2d550b4..a1f2eb9d9ec 100755
--- a/docker/test/performance-comparison/report.py
+++ b/docker/test/performance-comparison/report.py
@@ -626,7 +626,9 @@ if args.report == "main":
message_array.append(str(faster_queries) + " faster")
if slower_queries:
- if slower_queries > 3:
+ # This threshold should be synchronized with the value in https://github.com/ClickHouse/ClickHouse/blob/master/tests/ci/performance_comparison_check.py#L225
+ # The false-positive rate should be < 1%: https://shorturl.at/CDEK8
+ if slower_queries > 5:
status = "failure"
message_array.append(str(slower_queries) + " slower")
diff --git a/docker/test/sqlancer/Dockerfile b/docker/test/sqlancer/Dockerfile
index a68b626eb66..5977044345e 100644
--- a/docker/test/sqlancer/Dockerfile
+++ b/docker/test/sqlancer/Dockerfile
@@ -12,10 +12,10 @@ RUN apt-get update --yes && \
# We need to get the repository's HEAD each time despite caching, so we invalidate the layers' cache
ARG CACHE_INVALIDATOR=0
RUN mkdir /sqlancer && \
- wget -q -O- https://github.com/sqlancer/sqlancer/archive/master.tar.gz | \
+ wget -q -O- https://github.com/sqlancer/sqlancer/archive/main.tar.gz | \
tar zx -C /sqlancer && \
- cd /sqlancer/sqlancer-master && \
- mvn package -DskipTests && \
+ cd /sqlancer/sqlancer-main && \
+ mvn --no-transfer-progress package -DskipTests && \
rm -r /root/.m2
COPY run.sh /
diff --git a/docker/test/sqlancer/process_sqlancer_result.py b/docker/test/sqlancer/process_sqlancer_result.py
index 3bed4578565..06abb52abf8 100755
--- a/docker/test/sqlancer/process_sqlancer_result.py
+++ b/docker/test/sqlancer/process_sqlancer_result.py
@@ -16,7 +16,6 @@ def process_result(result_folder):
"TLPGroupBy",
"TLPHaving",
"TLPWhere",
- "TLPWhereGroupBy",
"NoREC",
]
failed_tests = []
diff --git a/docker/test/sqlancer/run.sh b/docker/test/sqlancer/run.sh
index 4a0f0f6a512..b186bc155a2 100755
--- a/docker/test/sqlancer/run.sh
+++ b/docker/test/sqlancer/run.sh
@@ -33,7 +33,7 @@ cd /workspace
for _ in $(seq 1 60); do if [[ $(wget -q 'localhost:8123' -O-) == 'Ok.' ]]; then break ; else sleep 1; fi ; done
-cd /sqlancer/sqlancer-master
+cd /sqlancer/sqlancer-main
TIMEOUT=300
NUM_QUERIES=1000
diff --git a/docker/test/sqllogic/Dockerfile b/docker/test/sqllogic/Dockerfile
index 83dcf7e1f56..5cf71e4d3f8 100644
--- a/docker/test/sqllogic/Dockerfile
+++ b/docker/test/sqllogic/Dockerfile
@@ -13,6 +13,7 @@ RUN apt-get update --yes \
sqlite3 \
unixodbc \
unixodbc-dev \
+ odbcinst \
sudo \
&& apt-get clean
diff --git a/docker/test/stateful/Dockerfile b/docker/test/stateful/Dockerfile
index 71a2e92e3a8..f513735a2d0 100644
--- a/docker/test/stateful/Dockerfile
+++ b/docker/test/stateful/Dockerfile
@@ -16,8 +16,9 @@ COPY s3downloader /s3downloader
ENV S3_URL="https://clickhouse-datasets.s3.amazonaws.com"
ENV DATASETS="hits visits"
-RUN npm install -g azurite
-RUN npm install tslib
+# The following is already done in clickhouse/stateless-test
+# RUN npm install -g azurite
+# RUN npm install tslib
COPY run.sh /
CMD ["/bin/bash", "/run.sh"]
diff --git a/docker/test/stateless/Dockerfile b/docker/test/stateless/Dockerfile
index 40109255a7e..32996140521 100644
--- a/docker/test/stateless/Dockerfile
+++ b/docker/test/stateless/Dockerfile
@@ -20,6 +20,7 @@ RUN apt-get update -y \
netcat-openbsd \
nodejs \
npm \
+ odbcinst \
openjdk-11-jre-headless \
openssl \
postgresql-client \
@@ -71,7 +72,7 @@ RUN arch=${TARGETARCH:-amd64} \
&& chmod +x ./mc ./minio
-RUN wget 'https://dlcdn.apache.org/hadoop/common/hadoop-3.3.1/hadoop-3.3.1.tar.gz' \
+RUN wget --no-verbose 'https://dlcdn.apache.org/hadoop/common/hadoop-3.3.1/hadoop-3.3.1.tar.gz' \
&& tar -xvf hadoop-3.3.1.tar.gz \
&& rm -rf hadoop-3.3.1.tar.gz
@@ -79,8 +80,8 @@ ENV MINIO_ROOT_USER="clickhouse"
ENV MINIO_ROOT_PASSWORD="clickhouse"
ENV EXPORT_S3_STORAGE_POLICIES=1
-RUN npm install -g azurite
-RUN npm install tslib
+RUN npm install -g azurite \
+ && npm install -g tslib
COPY run.sh /
COPY setup_minio.sh /
diff --git a/docker/test/stateless/run.sh b/docker/test/stateless/run.sh
index 5d0a7b50741..fe53925ecc8 100755
--- a/docker/test/stateless/run.sh
+++ b/docker/test/stateless/run.sh
@@ -15,6 +15,12 @@ dpkg -i package_folder/clickhouse-client_*.deb
ln -s /usr/share/clickhouse-test/clickhouse-test /usr/bin/clickhouse-test
+# shellcheck disable=SC1091
+source /usr/share/clickhouse-test/ci/attach_gdb.lib || true # FIXME: to not break old builds, clean on 2023-09-01
+
+# shellcheck disable=SC1091
+source /usr/share/clickhouse-test/ci/utils.lib || true # FIXME: to not break old builds, clean on 2023-09-01
+
# install test configs
/usr/share/clickhouse-test/config/install.sh
@@ -85,6 +91,24 @@ fi
sleep 5
+attach_gdb_to_clickhouse || true # FIXME: to not break old builds, clean on 2023-09-01
+
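+# (declare -F succeeds only if its argument names a defined shell function.)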
+function fn_exists() {
+ declare -F "$1" > /dev/null;
+}
+
+# FIXME: to not break old builds, clean on 2023-09-01
+function try_run_with_retry() {
+ local total_retries="$1"
+ shift
+
+ if fn_exists run_with_retry; then
+ run_with_retry "$total_retries" "$@"
+ else
+ "$@"
+ fi
+}
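+# e.g. `try_run_with_retry 10 clickhouse-client -q "SELECT 1"` (illustrative
+# command) uses run_with_retry with up to 10 attempts when utils.lib was
+# sourced, and otherwise runs the command once.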
+
function run_tests()
{
set -x
@@ -132,8 +156,7 @@ function run_tests()
ADDITIONAL_OPTIONS+=('--report-logs-stats')
- clickhouse-test "00001_select_1" > /dev/null ||:
- clickhouse-client -q "insert into system.zookeeper (name, path, value) values ('auxiliary_zookeeper2', '/test/chroot/', '')" ||:
+ try_run_with_retry 10 clickhouse-client -q "insert into system.zookeeper (name, path, value) values ('auxiliary_zookeeper2', '/test/chroot/', '')"
set +e
clickhouse-test --testname --shard --zookeeper --check-zookeeper-session --hung-check --print-time \
diff --git a/docker/test/style/Dockerfile b/docker/test/style/Dockerfile
index 746cc7bb2d5..2aa0b1a62d6 100644
--- a/docker/test/style/Dockerfile
+++ b/docker/test/style/Dockerfile
@@ -18,7 +18,7 @@ RUN apt-get update && env DEBIAN_FRONTEND=noninteractive apt-get install --yes \
python3-pip \
shellcheck \
yamllint \
- && pip3 install black==23.1.0 boto3 codespell==2.2.1 dohq-artifactory mypy PyGithub unidiff pylint==2.6.2 \
+ && pip3 install black==23.1.0 boto3 codespell==2.2.1 mypy==1.3.0 PyGithub unidiff pylint==2.6.2 \
&& apt-get clean \
&& rm -rf /root/.cache/pip
diff --git a/docker/test/upgrade/run.sh b/docker/test/upgrade/run.sh
index bd0c59a12cd..8fd514eaa93 100644
--- a/docker/test/upgrade/run.sh
+++ b/docker/test/upgrade/run.sh
@@ -59,14 +59,9 @@ install_packages previous_release_package_folder
# available for dump via clickhouse-local
configure
-# local_blob_storage disk type does not exist in older versions
-sudo cat /etc/clickhouse-server/config.d/storage_conf.xml \
- | sed "s|local_blob_storage|local|" \
- > /etc/clickhouse-server/config.d/storage_conf.xml.tmp
-sudo mv /etc/clickhouse-server/config.d/storage_conf.xml.tmp /etc/clickhouse-server/config.d/storage_conf.xml
-
# it contains some new settings, but we can safely remove it
rm /etc/clickhouse-server/config.d/merge_tree.xml
+rm /etc/clickhouse-server/users.d/nonconst_timezone.xml
start
stop
@@ -92,13 +87,9 @@ export USE_S3_STORAGE_FOR_MERGE_TREE=1
export ZOOKEEPER_FAULT_INJECTION=0
configure
-sudo cat /etc/clickhouse-server/config.d/storage_conf.xml \
- | sed "s|local_blob_storage|local|" \
- > /etc/clickhouse-server/config.d/storage_conf.xml.tmp
-sudo mv /etc/clickhouse-server/config.d/storage_conf.xml.tmp /etc/clickhouse-server/config.d/storage_conf.xml
-
# it contains some new settings, but we can safely remove it
rm /etc/clickhouse-server/config.d/merge_tree.xml
+rm /etc/clickhouse-server/users.d/nonconst_timezone.xml
start
@@ -128,6 +119,13 @@ mv /var/log/clickhouse-server/clickhouse-server.log /var/log/clickhouse-server/c
install_packages package_folder
export ZOOKEEPER_FAULT_INJECTION=1
configure
+
+# Just in case the previous version left some garbage in zk
+sudo cat /etc/clickhouse-server/config.d/lost_forever_check.xml \
+ | sed "s|>1<|>0<|g" \
+ > /etc/clickhouse-server/config.d/lost_forever_check.xml.tmp
+sudo mv /etc/clickhouse-server/config.d/lost_forever_check.xml.tmp /etc/clickhouse-server/config.d/lost_forever_check.xml
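+# (The sed flips every ">1<" to ">0<", i.e. any flag enabled in
+# lost_forever_check.xml is switched off for this run.)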
+
start 500
clickhouse-client --query "SELECT 'Server successfully started', 'OK', NULL, ''" >> /test_output/test_results.tsv \
|| (rg --text ".*Application" /var/log/clickhouse-server/clickhouse-server.log > /test_output/application_errors.txt \
@@ -191,6 +189,7 @@ rg -Fav -e "Code: 236. DB::Exception: Cancelled merging parts" \
-e "Authentication failed" \
-e "Cannot flush" \
-e "Container already exists" \
+ -e "doesn't have metadata version on disk" \
clickhouse-server.upgrade.log \
| grep -av -e "_repl_01111_.*Mapping for table with UUID" \
| zgrep -Fa "" > /test_output/upgrade_error_messages.txt \
diff --git a/docker/test/util/Dockerfile b/docker/test/util/Dockerfile
index a49278e960b..85e888f1df7 100644
--- a/docker/test/util/Dockerfile
+++ b/docker/test/util/Dockerfile
@@ -1,5 +1,5 @@
# docker build -t clickhouse/test-util .
-FROM ubuntu:20.04
+FROM ubuntu:22.04
# ARG for quick switch to a given ubuntu mirror
ARG apt_archive="http://archive.ubuntu.com"
diff --git a/docker/test/util/process_functional_tests_result.py b/docker/test/util/process_functional_tests_result.py
index c75a3500831..fd4cc9f4bf7 100755
--- a/docker/test/util/process_functional_tests_result.py
+++ b/docker/test/util/process_functional_tests_result.py
@@ -86,7 +86,7 @@ def process_test_log(log_path, broken_tests):
test_name,
"NOT_FAILED",
test_time,
- ["This test passed. Update broken_tests.txt.\n"],
+ ["This test passed. Update analyzer_tech_debt.txt.\n"],
)
)
else:
@@ -205,7 +205,7 @@ if __name__ == "__main__":
parser.add_argument("--in-results-dir", default="/test_output/")
parser.add_argument("--out-results-file", default="/test_output/test_results.tsv")
parser.add_argument("--out-status-file", default="/test_output/check_status.tsv")
- parser.add_argument("--broken-tests", default="/broken_tests.txt")
+ parser.add_argument("--broken-tests", default="/analyzer_tech_debt.txt")
args = parser.parse_args()
broken_tests = list()
diff --git a/docs/_description_templates/template-data-type.md b/docs/_description_templates/template-data-type.md
new file mode 100644
index 00000000000..239edb2808b
--- /dev/null
+++ b/docs/_description_templates/template-data-type.md
@@ -0,0 +1,29 @@
+---
+toc_priority:
+toc_title:
+---
+
+# data_type_name {#data_type-name}
+
+Description.
+
+**Parameters** (Optional)
+
+- `x` — Description. [Type name](relative/path/to/type/dscr.md#type).
+- `y` — Description. [Type name](relative/path/to/type/dscr.md#type).
+
+**Examples**
+
+```sql
+
+```
+
+## Additional Info {#additional-info} (Optional)
+
+The name of an additional section can be anything, for example, **Usage**.
+
+**See Also** (Optional)
+
+- [link](#)
+
+[Original article](https://clickhouse.com/docs/en/data-types//)
diff --git a/docs/_description_templates/template-engine.md b/docs/_description_templates/template-engine.md
new file mode 100644
index 00000000000..392bc59ed33
--- /dev/null
+++ b/docs/_description_templates/template-engine.md
@@ -0,0 +1,63 @@
+# EngineName {#enginename}
+
+- What the Database/Table engine does.
+- Relations with other engines if they exist.
+
+## Creating a Database {#creating-a-database}
+``` sql
+ CREATE DATABASE ...
+```
+or
+
+## Creating a Table {#creating-a-table}
+``` sql
+ CREATE TABLE ...
+```
+
+**Engine Parameters**
+
+**Query Clauses** (for Table engines only)
+
+## Virtual columns {#virtual-columns} (for Table engines only)
+
+List the virtual columns with descriptions, if they exist.
+
+## Data Types Support {#data_types-support} (for Database engines only)
+
+| EngineName | ClickHouse |
+|-----------------------|------------------------------------|
+| NativeDataTypeName | [ClickHouseDataTypeName](link#) |
+
+
+## Specifics and recommendations {#specifics-and-recommendations}
+
+- Algorithms
+- Specifics of read and write processes
+- Examples of tasks
+- Recommendations for usage
+- Specifics of data storage
+
+## Usage Example {#usage-example}
+
+The example must show usage and use cases. The following text contains the recommended parts of this section.
+
+Input table:
+
+``` text
+```
+
+Query:
+
+``` sql
+```
+
+Result:
+
+``` text
+```
+
+Follow up with any text to clarify the example.
+
+**See Also**
+
+- [link](#)
diff --git a/docs/_description_templates/template-function.md b/docs/_description_templates/template-function.md
new file mode 100644
index 00000000000..6bdc764c449
--- /dev/null
+++ b/docs/_description_templates/template-function.md
@@ -0,0 +1,51 @@
+## functionName {#functionname-in-lower-case}
+
+Short description.
+
+**Syntax** (without SELECT)
+
+``` sql
+
+```
+
+Alias: ``. (Optional)
+
+More text (Optional).
+
+**Arguments** (Optional)
+
+- `x` — Description. Optional (only for optional arguments). Possible values: . Default value: . [Type name](relative/path/to/type/dscr.md#type).
+- `y` — Description. Optional (only for optional arguments). Possible values: . Default value: . [Type name](relative/path/to/type/dscr.md#type).
+
+**Parameters** (Optional, only for parametric aggregate functions)
+
+- `z` — Description. Optional (only for optional parameters). Possible values: . Default value: . [Type name](relative/path/to/type/dscr.md#type).
+
+**Returned value(s)**
+
+- Returned values list.
+
+Type: [Type name](relative/path/to/type/dscr.md#type).
+
+**Example**
+
+The example must show usage and/or use cases. The following text contains the recommended parts of an example.
+
+Input table (Optional):
+
+``` text
+```
+
+Query:
+
+``` sql
+```
+
+Result:
+
+``` text
+```
+
+**See Also** (Optional)
+
+- [link](#)
diff --git a/docs/_description_templates/template-server-setting.md b/docs/_description_templates/template-server-setting.md
new file mode 100644
index 00000000000..0b37d46cf41
--- /dev/null
+++ b/docs/_description_templates/template-server-setting.md
@@ -0,0 +1,33 @@
+## server_setting_name {#server_setting_name}
+
+Description.
+
+Describe what is configured in this section of settings.
+
+Possible value: ...
+
+Default value: ...
+
+**Settings** (Optional)
+
+If the section contains several settings, list them here. Specify possible values and default values:
+
+- setting_1 — Description.
+- setting_2 — Description.
+
+**Example**
+
+```xml
+
+ ...
+ ...
+
+```
+
+**Additional Info** (Optional)
+
+The name of an additional section can be anything, for example, **Usage**.
+
+**See Also** (Optional)
+
+- [link](#)
diff --git a/docs/_description_templates/template-setting.md b/docs/_description_templates/template-setting.md
new file mode 100644
index 00000000000..fc912aba3e1
--- /dev/null
+++ b/docs/_description_templates/template-setting.md
@@ -0,0 +1,27 @@
+## setting_name {#setting_name}
+
+Description.
+
+For a switch setting, use the typical phrase: “Enables or disables something …”.
+
+Possible values:
+
+*For a switch setting:*
+
+- 0 — Disabled.
+- 1 — Enabled.
+
+*For another setting (typical phrases):*
+
+- Positive integer.
+- 0 — Disabled or unlimited or something else.
+
+Default value: `value`.
+
+**Additional Info** (Optional)
+
+The name of an additional section can be anything, for example, **Usage**.
+
+**See Also** (Optional)
+
+- [link](#)
diff --git a/docs/_description_templates/template-statement.md b/docs/_description_templates/template-statement.md
new file mode 100644
index 00000000000..238570c2217
--- /dev/null
+++ b/docs/_description_templates/template-statement.md
@@ -0,0 +1,24 @@
+# Statement name (for example, SHOW USER) {#statement-name-in-lower-case}
+
+Brief description of what the statement does.
+
+**Syntax**
+
+```sql
+Syntax of the statement.
+```
+
+## Other necessary sections of the description (Optional) {#anchor}
+
+Examples of descriptions with a complicated structure:
+
+- https://clickhouse.com/docs/en/sql-reference/statements/grant/
+- https://clickhouse.com/docs/en/sql-reference/statements/revoke/
+- https://clickhouse.com/docs/en/sql-reference/statements/select/join/
+
+
+**See Also** (Optional)
+
+Links to related topics as a list.
+
+- [link](#)
diff --git a/docs/_description_templates/template-system-table.md b/docs/_description_templates/template-system-table.md
new file mode 100644
index 00000000000..f2decc4bb6d
--- /dev/null
+++ b/docs/_description_templates/template-system-table.md
@@ -0,0 +1,25 @@
+# system.table_name {#system-tables_table-name}
+
+Description.
+
+Columns:
+
+- `column_name` ([data_type_name](path/to/data_type.md)) — Description.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT * FROM system.table_name
+```
+
+Result:
+
+``` text
+Some output. It shouldn't be too long.
+```
+
+**See Also**
+
+- [Article name](path/to/article_name.md) — Some words about referenced information.
diff --git a/docs/changelogs/v22.8.18.31-lts.md b/docs/changelogs/v22.8.18.31-lts.md
new file mode 100644
index 00000000000..709bb926f8a
--- /dev/null
+++ b/docs/changelogs/v22.8.18.31-lts.md
@@ -0,0 +1,32 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v22.8.18.31-lts (4de7a95a544) FIXME as compared to v22.8.17.17-lts (df7f2ef0b41)
+
+#### Performance Improvement
+* Backported in [#49214](https://github.com/ClickHouse/ClickHouse/issues/49214): Fixed excessive reading in queries with `FINAL`. [#47801](https://github.com/ClickHouse/ClickHouse/pull/47801) ([Nikita Taranov](https://github.com/nickitat)).
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#49079](https://github.com/ClickHouse/ClickHouse/issues/49079): Update time zones. The following were updated: Africa/Cairo, Africa/Casablanca, Africa/El_Aaiun, America/Bogota, America/Cambridge_Bay, America/Ciudad_Juarez, America/Godthab, America/Inuvik, America/Iqaluit, America/Nuuk, America/Ojinaga, America/Pangnirtung, America/Rankin_Inlet, America/Resolute, America/Whitehorse, America/Yellowknife, Asia/Gaza, Asia/Hebron, Asia/Kuala_Lumpur, Asia/Singapore, Canada/Yukon, Egypt, Europe/Kirov, Europe/Volgograd, Singapore. [#48572](https://github.com/ClickHouse/ClickHouse/pull/48572) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix bad cast from LowCardinality column when using short circuit function execution [#43311](https://github.com/ClickHouse/ClickHouse/pull/43311) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix msan issue in randomStringUTF8() [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* JIT compilation not equals NaN fix [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fixed type conversion from Date/Date32 to DateTime64 when querying with DateTime64 index [#50280](https://github.com/ClickHouse/ClickHouse/pull/50280) ([Lucas Chang](https://github.com/lucas-tubi)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+* Fix Log family table return wrong rows count after truncate [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Do not read all the columns from right GLOBAL JOIN table. [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Improve test reports [#49151](https://github.com/ClickHouse/ClickHouse/pull/49151) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update github.com/distribution/distribution [#50114](https://github.com/ClickHouse/ClickHouse/pull/50114) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Catch issues with dockerd during the build [#50700](https://github.com/ClickHouse/ClickHouse/pull/50700) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v22.8.19.10-lts.md b/docs/changelogs/v22.8.19.10-lts.md
new file mode 100644
index 00000000000..b3990c74e46
--- /dev/null
+++ b/docs/changelogs/v22.8.19.10-lts.md
@@ -0,0 +1,19 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v22.8.19.10-lts (989bc2fe8b0) FIXME as compared to v22.8.18.31-lts (4de7a95a544)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Fix a versions' tweak for tagged commits, improve version_helper [#51035](https://github.com/ClickHouse/ClickHouse/pull/51035) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Sqlancer has changed master to main [#51060](https://github.com/ClickHouse/ClickHouse/pull/51060) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.2.7.32-stable.md b/docs/changelogs/v23.2.7.32-stable.md
new file mode 100644
index 00000000000..db5e9e76311
--- /dev/null
+++ b/docs/changelogs/v23.2.7.32-stable.md
@@ -0,0 +1,35 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.2.7.32-stable (934f6a2aa0e) FIXME as compared to v23.2.6.34-stable (570190045b0)
+
+#### Performance Improvement
+* Backported in [#49218](https://github.com/ClickHouse/ClickHouse/issues/49218): Fixed excessive reading in queries with `FINAL`. [#47801](https://github.com/ClickHouse/ClickHouse/pull/47801) ([Nikita Taranov](https://github.com/nickitat)).
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#49208](https://github.com/ClickHouse/ClickHouse/issues/49208): Fix glibc compatibility check: replace `preadv` from musl. [#49144](https://github.com/ClickHouse/ClickHouse/pull/49144) ([alesapin](https://github.com/alesapin)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix key not found error for queries with multiple StorageJoin [#49137](https://github.com/ClickHouse/ClickHouse/pull/49137) ([vdimir](https://github.com/vdimir)).
+* Fix race on Outdated parts loading [#49223](https://github.com/ClickHouse/ClickHouse/pull/49223) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix bug in DISTINCT [#49628](https://github.com/ClickHouse/ClickHouse/pull/49628) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix msan issue in randomStringUTF8() [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix IPv6 encoding in protobuf [#49933](https://github.com/ClickHouse/ClickHouse/pull/49933) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Avoid deadlock when starting table in attach thread of `ReplicatedMergeTree` [#50026](https://github.com/ClickHouse/ClickHouse/pull/50026) ([Antonio Andelic](https://github.com/antonio2368)).
+* JIT compilation not equals NaN fix [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Improve test reports [#49151](https://github.com/ClickHouse/ClickHouse/pull/49151) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fallback auth gh api [#49314](https://github.com/ClickHouse/ClickHouse/pull/49314) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Improve CI: status commit, auth for get_gh_api [#49388](https://github.com/ClickHouse/ClickHouse/pull/49388) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update github.com/distribution/distribution [#50114](https://github.com/ClickHouse/ClickHouse/pull/50114) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Catch issues with dockerd during the build [#50700](https://github.com/ClickHouse/ClickHouse/pull/50700) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.3.3.52-lts.md b/docs/changelogs/v23.3.3.52-lts.md
new file mode 100644
index 00000000000..f845e14eb78
--- /dev/null
+++ b/docs/changelogs/v23.3.3.52-lts.md
@@ -0,0 +1,45 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.3.3.52-lts (cb963c474db) FIXME as compared to v23.3.2.37-lts (1b144bcd101)
+
+#### Improvement
+* Backported in [#49954](https://github.com/ClickHouse/ClickHouse/issues/49954): Add support for (an unusual) case where the arguments in the `IN` operator are single-element tuples. [#49844](https://github.com/ClickHouse/ClickHouse/pull/49844) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#49210](https://github.com/ClickHouse/ClickHouse/issues/49210): Fix glibc compatibility check: replace `preadv` from musl. [#49144](https://github.com/ClickHouse/ClickHouse/pull/49144) ([alesapin](https://github.com/alesapin)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix aggregate empty string error [#48999](https://github.com/ClickHouse/ClickHouse/pull/48999) ([LiuNeng](https://github.com/liuneng1994)).
+* Fix key not found error for queries with multiple StorageJoin [#49137](https://github.com/ClickHouse/ClickHouse/pull/49137) ([vdimir](https://github.com/vdimir)).
+* Fix race on Outdated parts loading [#49223](https://github.com/ClickHouse/ClickHouse/pull/49223) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix bug in DISTINCT [#49628](https://github.com/ClickHouse/ClickHouse/pull/49628) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix msan issue in randomStringUTF8() [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* fix `is_prefix` in OptimizeRegularExpression [#49919](https://github.com/ClickHouse/ClickHouse/pull/49919) ([Han Fei](https://github.com/hanfei1991)).
+* Fix IPv6 encoding in protobuf [#49933](https://github.com/ClickHouse/ClickHouse/pull/49933) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Avoid deadlock when starting table in attach thread of `ReplicatedMergeTree` [#50026](https://github.com/ClickHouse/ClickHouse/pull/50026) ([Antonio Andelic](https://github.com/antonio2368)).
+* JIT compilation not equals NaN fix [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix reconnecting of HTTPS session when target host IP was changed [#50240](https://github.com/ClickHouse/ClickHouse/pull/50240) ([Aleksei Filatov](https://github.com/aalexfvk)).
+* Fixed type conversion from Date/Date32 to DateTime64 when querying with DateTime64 index [#50280](https://github.com/ClickHouse/ClickHouse/pull/50280) ([Lucas Chang](https://github.com/lucas-tubi)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+* Fix incorrect constant folding [#50536](https://github.com/ClickHouse/ClickHouse/pull/50536) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix Log family table return wrong rows count after truncate [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Fix bug in `uniqExact` parallel merging [#50590](https://github.com/ClickHouse/ClickHouse/pull/50590) ([Nikita Taranov](https://github.com/nickitat)).
+* Do not read all the columns from right GLOBAL JOIN table. [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Implement status comment [#48468](https://github.com/ClickHouse/ClickHouse/pull/48468) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update curl to 8.0.1 (for CVEs) [#48765](https://github.com/ClickHouse/ClickHouse/pull/48765) ([Boris Kuschel](https://github.com/bkuschel)).
+* Improve test reports [#49151](https://github.com/ClickHouse/ClickHouse/pull/49151) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fallback auth gh api [#49314](https://github.com/ClickHouse/ClickHouse/pull/49314) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Improve CI: status commit, auth for get_gh_api [#49388](https://github.com/ClickHouse/ClickHouse/pull/49388) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update github.com/distribution/distribution [#50114](https://github.com/ClickHouse/ClickHouse/pull/50114) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Catch issues with dockerd during the build [#50700](https://github.com/ClickHouse/ClickHouse/pull/50700) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.3.4.17-lts.md b/docs/changelogs/v23.3.4.17-lts.md
new file mode 100644
index 00000000000..41d9d7dd06c
--- /dev/null
+++ b/docs/changelogs/v23.3.4.17-lts.md
@@ -0,0 +1,22 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.3.4.17-lts (2c99b73ff40) FIXME as compared to v23.3.3.52-lts (cb963c474db)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix crash when Pool::Entry::disconnect() is called [#50334](https://github.com/ClickHouse/ClickHouse/pull/50334) ([Val Doroshchuk](https://github.com/valbok)).
+* Avoid storing logs in Keeper containing unknown operation [#50751](https://github.com/ClickHouse/ClickHouse/pull/50751) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Don't mark a part as broken on `Poco::TimeoutException` [#50811](https://github.com/ClickHouse/ClickHouse/pull/50811) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix a versions' tweak for tagged commits, improve version_helper [#51035](https://github.com/ClickHouse/ClickHouse/pull/51035) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Sqlancer has changed master to main [#51060](https://github.com/ClickHouse/ClickHouse/pull/51060) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.3.5.9-lts.md b/docs/changelogs/v23.3.5.9-lts.md
new file mode 100644
index 00000000000..df1aab541ec
--- /dev/null
+++ b/docs/changelogs/v23.3.5.9-lts.md
@@ -0,0 +1,19 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.3.5.9-lts (f5fbc2fd2b3) FIXME as compared to v23.3.4.17-lts (2c99b73ff40)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix broken index analysis when binary operator contains a null constant argument [#50177](https://github.com/ClickHouse/ClickHouse/pull/50177) ([Amos Bird](https://github.com/amosbird)).
+* Cleanup moving parts [#50489](https://github.com/ClickHouse/ClickHouse/pull/50489) ([vdimir](https://github.com/vdimir)).
+* Do not apply projection if read-in-order was enabled. [#50923](https://github.com/ClickHouse/ClickHouse/pull/50923) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Increase max array size in group bitmap [#50620](https://github.com/ClickHouse/ClickHouse/pull/50620) ([Kruglov Pavel](https://github.com/Avogar)).
+
diff --git a/docs/changelogs/v23.3.6.7-lts.md b/docs/changelogs/v23.3.6.7-lts.md
new file mode 100644
index 00000000000..387cc126aba
--- /dev/null
+++ b/docs/changelogs/v23.3.6.7-lts.md
@@ -0,0 +1,19 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.3.6.7-lts (7e3f0a271b7) FIXME as compared to v23.3.5.9-lts (f5fbc2fd2b3)
+
+#### Improvement
+* Backported in [#51240](https://github.com/ClickHouse/ClickHouse/issues/51240): Improve the progress bar for file/s3/hdfs/url table functions by using chunk size from source data and using incremental total size counting in each thread. Fix the progress bar for *Cluster functions. This closes [#47250](https://github.com/ClickHouse/ClickHouse/issues/47250). [#51088](https://github.com/ClickHouse/ClickHouse/pull/51088) ([Kruglov Pavel](https://github.com/Avogar)).
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#51529](https://github.com/ClickHouse/ClickHouse/issues/51529): Split huge `RUN` in Dockerfile into smaller conditional. Install the necessary tools on demand in the same `RUN` layer, and remove them after that. Upgrade the OS only once at the beginning. Use a modern way to check the signed repository. Downgrade the base repo to ubuntu:20.04 to address the issues on older docker versions. Upgrade golang version to address golang vulnerabilities. [#51504](https://github.com/ClickHouse/ClickHouse/pull/51504) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix type of LDAP server params hash in cache entry [#50865](https://github.com/ClickHouse/ClickHouse/pull/50865) ([Julian Maicher](https://github.com/jmaicher)).
+
diff --git a/docs/changelogs/v23.3.7.5-lts.md b/docs/changelogs/v23.3.7.5-lts.md
new file mode 100644
index 00000000000..7a5fd5a19b6
--- /dev/null
+++ b/docs/changelogs/v23.3.7.5-lts.md
@@ -0,0 +1,16 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.3.7.5-lts (bc683c11c92) FIXME as compared to v23.3.6.7-lts (7e3f0a271b7)
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#51568](https://github.com/ClickHouse/ClickHouse/issues/51568): This a follow-up for [#51504](https://github.com/ClickHouse/ClickHouse/issues/51504), the cleanup was lost during refactoring. [#51564](https://github.com/ClickHouse/ClickHouse/pull/51564) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix fuzzer failure in ActionsDAG [#51301](https://github.com/ClickHouse/ClickHouse/pull/51301) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
diff --git a/docs/changelogs/v23.4.3.48-stable.md b/docs/changelogs/v23.4.3.48-stable.md
new file mode 100644
index 00000000000..8bafd22bfbd
--- /dev/null
+++ b/docs/changelogs/v23.4.3.48-stable.md
@@ -0,0 +1,42 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.4.3.48-stable (d9199f8d3cc) FIXME as compared to v23.4.2.11-stable (b6442320f9d)
+
+#### Backward Incompatible Change
+* Backported in [#49981](https://github.com/ClickHouse/ClickHouse/issues/49981): Revert "`groupArray` returns cannot be nullable" (due to binary compatibility breakage for `groupArray`/`groupArrayLast`/`groupArraySample` over `Nullable` types, which likely will lead to `TOO_LARGE_ARRAY_SIZE` or `CANNOT_READ_ALL_DATA`). [#49971](https://github.com/ClickHouse/ClickHouse/pull/49971) ([Azat Khuzhin](https://github.com/azat)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix key not found error for queries with multiple StorageJoin [#49137](https://github.com/ClickHouse/ClickHouse/pull/49137) ([vdimir](https://github.com/vdimir)).
+* Fix fuzz bug when subquery set is not built when reading from remote() [#49425](https://github.com/ClickHouse/ClickHouse/pull/49425) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix postgres database setting [#49481](https://github.com/ClickHouse/ClickHouse/pull/49481) ([Mal Curtis](https://github.com/snikch)).
+* Fix AsynchronousReadIndirectBufferFromRemoteFS breaking on short seeks [#49525](https://github.com/ClickHouse/ClickHouse/pull/49525) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix bug in DISTINCT [#49628](https://github.com/ClickHouse/ClickHouse/pull/49628) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix assert in SpanHolder::finish() with fibers [#49673](https://github.com/ClickHouse/ClickHouse/pull/49673) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix msan issue in randomStringUTF8() [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* fix `is_prefix` in OptimizeRegularExpression [#49919](https://github.com/ClickHouse/ClickHouse/pull/49919) ([Han Fei](https://github.com/hanfei1991)).
+* Fix IPv6 encoding in protobuf [#49933](https://github.com/ClickHouse/ClickHouse/pull/49933) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Avoid deadlock when starting table in attach thread of `ReplicatedMergeTree` [#50026](https://github.com/ClickHouse/ClickHouse/pull/50026) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix assert in SpanHolder::finish() with fibers attempt 2 [#50034](https://github.com/ClickHouse/ClickHouse/pull/50034) ([Kruglov Pavel](https://github.com/Avogar)).
+* JIT compilation not equals NaN fix [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crashing in case of Replicated database without arguments [#50058](https://github.com/ClickHouse/ClickHouse/pull/50058) ([Azat Khuzhin](https://github.com/azat)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix iceberg metadata parsing [#50232](https://github.com/ClickHouse/ClickHouse/pull/50232) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix bugs in Poco sockets in non-blocking mode, use true non-blocking sockets [#50252](https://github.com/ClickHouse/ClickHouse/pull/50252) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fixed type conversion from Date/Date32 to DateTime64 when querying with DateTime64 index [#50280](https://github.com/ClickHouse/ClickHouse/pull/50280) ([Lucas Chang](https://github.com/lucas-tubi)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+* Fix Log family table return wrong rows count after truncate [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Fix bug in `uniqExact` parallel merging [#50590](https://github.com/ClickHouse/ClickHouse/pull/50590) ([Nikita Taranov](https://github.com/nickitat)).
+* Do not read all the columns from right GLOBAL JOIN table. [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Improve CI: status commit, auth for get_gh_api [#49388](https://github.com/ClickHouse/ClickHouse/pull/49388) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update github.com/distribution/distribution [#50114](https://github.com/ClickHouse/ClickHouse/pull/50114) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Catch issues with dockerd during the build [#50700](https://github.com/ClickHouse/ClickHouse/pull/50700) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.4.4.16-stable.md b/docs/changelogs/v23.4.4.16-stable.md
new file mode 100644
index 00000000000..72056f72091
--- /dev/null
+++ b/docs/changelogs/v23.4.4.16-stable.md
@@ -0,0 +1,22 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.4.4.16-stable (747ba4fc6a0) FIXME as compared to v23.4.3.48-stable (d9199f8d3cc)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix crash when Pool::Entry::disconnect() is called [#50334](https://github.com/ClickHouse/ClickHouse/pull/50334) ([Val Doroshchuk](https://github.com/valbok)).
+* Fix iceberg V2 optional metadata parsing [#50974](https://github.com/ClickHouse/ClickHouse/pull/50974) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Don't mark a part as broken on `Poco::TimeoutException` [#50811](https://github.com/ClickHouse/ClickHouse/pull/50811) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix a versions' tweak for tagged commits, improve version_helper [#51035](https://github.com/ClickHouse/ClickHouse/pull/51035) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Sqlancer has changed master to main [#51060](https://github.com/ClickHouse/ClickHouse/pull/51060) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.4.5.22-stable.md b/docs/changelogs/v23.4.5.22-stable.md
new file mode 100644
index 00000000000..2d61f5b11cf
--- /dev/null
+++ b/docs/changelogs/v23.4.5.22-stable.md
@@ -0,0 +1,27 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.4.5.22-stable (0ced5d6a8da) FIXME as compared to v23.4.4.16-stable (747ba4fc6a0)
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#51530](https://github.com/ClickHouse/ClickHouse/issues/51530): Split huge `RUN` in Dockerfile into smaller conditional. Install the necessary tools on demand in the same `RUN` layer, and remove them after that. Upgrade the OS only once at the beginning. Use a modern way to check the signed repository. Downgrade the base repo to ubuntu:20.04 to address the issues on older docker versions. Upgrade golang version to address golang vulnerabilities. [#51504](https://github.com/ClickHouse/ClickHouse/pull/51504) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Backported in [#51570](https://github.com/ClickHouse/ClickHouse/issues/51570): This a follow-up for [#51504](https://github.com/ClickHouse/ClickHouse/issues/51504), the cleanup was lost during refactoring. [#51564](https://github.com/ClickHouse/ClickHouse/pull/51564) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix broken index analysis when binary operator contains a null constant argument [#50177](https://github.com/ClickHouse/ClickHouse/pull/50177) ([Amos Bird](https://github.com/amosbird)).
+* Fix reconnecting of HTTPS session when target host IP was changed [#50240](https://github.com/ClickHouse/ClickHouse/pull/50240) ([Aleksei Filatov](https://github.com/aalexfvk)).
+* Fix incorrect constant folding [#50536](https://github.com/ClickHouse/ClickHouse/pull/50536) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix type of LDAP server params hash in cache entry [#50865](https://github.com/ClickHouse/ClickHouse/pull/50865) ([Julian Maicher](https://github.com/jmaicher)).
+* Fallback to parsing big integer from String instead of exception in Parquet format [#50873](https://github.com/ClickHouse/ClickHouse/pull/50873) ([Kruglov Pavel](https://github.com/Avogar)).
+* Do not apply projection if read-in-order was enabled. [#50923](https://github.com/ClickHouse/ClickHouse/pull/50923) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix fuzzer failure in ActionsDAG [#51301](https://github.com/ClickHouse/ClickHouse/pull/51301) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Increase max array size in group bitmap [#50620](https://github.com/ClickHouse/ClickHouse/pull/50620) ([Kruglov Pavel](https://github.com/Avogar)).
+
diff --git a/docs/changelogs/v23.5.1.3174-stable.md b/docs/changelogs/v23.5.1.3174-stable.md
new file mode 100644
index 00000000000..01e5425de71
--- /dev/null
+++ b/docs/changelogs/v23.5.1.3174-stable.md
@@ -0,0 +1,599 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.5.1.3174-stable (2fec796e73e) FIXME as compared to v23.4.1.1943-stable (3920eb987f7)
+
+#### Backward Incompatible Change
+* Make local object storage work consistently with s3 object storage, fix problem with append (closes [#48465](https://github.com/ClickHouse/ClickHouse/issues/48465)), make it configurable as an independent storage. The change is backward incompatible because the cache on top of local object storage is not compatible with previous versions. [#48791](https://github.com/ClickHouse/ClickHouse/pull/48791) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* The `date_trunc` function now always returns the `DateTime` type. [#48851](https://github.com/ClickHouse/ClickHouse/pull/48851) ([Shane Andrade](https://github.com/mauidude)).
+* Remove the experimental feature "in-memory data parts". The data format is still supported, but the settings are no-op, and compact or wide parts will be used instead. This closes [#45409](https://github.com/ClickHouse/ClickHouse/issues/45409). [#49429](https://github.com/ClickHouse/ClickHouse/pull/49429) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Changed default values of settings parallelize_output_from_storages and input_format_parquet_preserve_order. This allows ClickHouse to reorder rows when reading from files (e.g. CSV or Parquet), greatly improving performance in many cases. To restore the old behavior of preserving order, use `parallelize_output_from_storages = 0`, `input_format_parquet_preserve_order = 1`. [#49479](https://github.com/ClickHouse/ClickHouse/pull/49479) ([Michael Kolupaev](https://github.com/al13n321)).
+* Make projections production-ready. Add the `optimize_use_projections` setting to control whether the projections will be selected for SELECT queries. The setting `allow_experimental_projection_optimization` is obsolete and does nothing. [#49719](https://github.com/ClickHouse/ClickHouse/pull/49719) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Mark joinGet() as non-deterministic (as is dictGet). [#49843](https://github.com/ClickHouse/ClickHouse/pull/49843) ([Azat Khuzhin](https://github.com/azat)).
+* Revert "`groupArray` returns cannot be nullable" (due to binary compatibility breakage for `groupArray`/`groupArrayLast`/`groupArraySample` over `Nullable` types, which likely will lead to `TOO_LARGE_ARRAY_SIZE` or `CANNOT_READ_ALL_DATA`). [#49971](https://github.com/ClickHouse/ClickHouse/pull/49971) ([Azat Khuzhin](https://github.com/azat)).
+
+#### New Feature
+* Password type in queries like `CREATE USER u IDENTIFIED BY 'p'` will be automatically set according to the setting `default_password_type` in the `config.xml` on the server. Closes [#42915](https://github.com/ClickHouse/ClickHouse/issues/42915). [#44674](https://github.com/ClickHouse/ClickHouse/pull/44674) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Add bcrypt password authentication type. Closes [#34599](https://github.com/ClickHouse/ClickHouse/issues/34599). [#44905](https://github.com/ClickHouse/ClickHouse/pull/44905) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Added `system.zookeeper_connection` table that shows information about ZooKeeper connections. [#45245](https://github.com/ClickHouse/ClickHouse/pull/45245) ([mateng915](https://github.com/mateng0915)).
+* Add urlCluster table function. Refactor all *Cluster table functions to reduce code duplication. Make schema inference work for all possible *Cluster function signatures and for named collections. Closes [#38499](https://github.com/ClickHouse/ClickHouse/issues/38499). [#45427](https://github.com/ClickHouse/ClickHouse/pull/45427) ([attack204](https://github.com/attack204)).
+* Extend `first_value` and `last_value` to accept null. [#46467](https://github.com/ClickHouse/ClickHouse/pull/46467) ([lgbo](https://github.com/lgbo-ustc)).
+* Add server and format settings `display_secrets_in_show_and_select` for displaying secrets of tables, databases, table functions, and dictionaries. Add privilege `displaySecretsInShowAndSelect` controlling which users can view secrets. [#46528](https://github.com/ClickHouse/ClickHouse/pull/46528) ([Mike Kot](https://github.com/myrrc)).
+* Add new function `generateRandomStructure` that generates random table structure. It can be used in combination with table function `generateRandom`. [#47409](https://github.com/ClickHouse/ClickHouse/pull/47409) ([Kruglov Pavel](https://github.com/Avogar)).
+* Added native ClickHouse Keeper CLI Client. [#47414](https://github.com/ClickHouse/ClickHouse/pull/47414) ([pufit](https://github.com/pufit)).
+* The query cache can now be used for production workloads. [#47977](https://github.com/ClickHouse/ClickHouse/pull/47977) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix a bug that prevented the use of `CASE` without an `ELSE` branch and extended `transform` to deal with more types. Also fix some bugs that made transform() return incorrect results when decimal types were mixed with other numeric types. [#48300](https://github.com/ClickHouse/ClickHouse/pull/48300) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* Added [server-side encryption using KMS keys](https://docs.aws.amazon.com/AmazonS3/latest/userguide/UsingKMSEncryption.html) with S3 tables, and the `header` setting with S3 disks. Closes [#48723](https://github.com/ClickHouse/ClickHouse/issues/48723). [#48724](https://github.com/ClickHouse/ClickHouse/pull/48724) ([Johann Gan](https://github.com/johanngan)).
+* Add a MemoryTracker for the background tasks (merges and mutations). Introduces the `merges_mutations_memory_usage_soft_limit` and `merges_mutations_memory_usage_to_ram_ratio` settings that represent the soft memory limit for merges and mutations. If this limit is reached, ClickHouse won't schedule new merge or mutation tasks. Also, the `MergesMutationsMemoryTracking` metric is introduced to allow observing the current memory usage of background tasks. Resubmit [#46089](https://github.com/ClickHouse/ClickHouse/issues/46089). Closes [#48774](https://github.com/ClickHouse/ClickHouse/issues/48774). [#48787](https://github.com/ClickHouse/ClickHouse/pull/48787) ([Dmitry Novik](https://github.com/novikd)).
+* Function `dotProduct` now works for arrays. [#49050](https://github.com/ClickHouse/ClickHouse/pull/49050) ([FFFFFFFHHHHHHH](https://github.com/FFFFFFFHHHHHHH)).
+* Support statement `SHOW INDEX` to improve compatibility with MySQL. [#49158](https://github.com/ClickHouse/ClickHouse/pull/49158) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add support for the virtual columns `_file` and `_path` to table function `url`, and improve its error message. Resolves [#49231](https://github.com/ClickHouse/ClickHouse/issues/49231) and [#49232](https://github.com/ClickHouse/ClickHouse/issues/49232). [#49356](https://github.com/ClickHouse/ClickHouse/pull/49356) ([Ziyi Tan](https://github.com/Ziy1-Tan)).
+* Adding the `grants` field in the users.xml file, which allows specifying grants for users. [#49381](https://github.com/ClickHouse/ClickHouse/pull/49381) ([pufit](https://github.com/pufit)).
+* Add aliases `str_to_map` and `mapfromstring` for `extractkeyvaluepairs`. Closes [#47185](https://github.com/ClickHouse/ClickHouse/issues/47185). [#49466](https://github.com/ClickHouse/ClickHouse/pull/49466) ([flynn](https://github.com/ucasfl)).
+* Support full/right join by using grace hash join algorithm. [#49483](https://github.com/ClickHouse/ClickHouse/pull/49483) ([lgbo](https://github.com/lgbo-ustc)).
+* `WITH FILL` modifier groups filling by sorting prefix. Controlled by `use_with_fill_by_sorting_prefix` setting (enabled by default). Related to [#33203](https://github.com/ClickHouse/ClickHouse/issues/33203)#issuecomment-1418736794. [#49503](https://github.com/ClickHouse/ClickHouse/pull/49503) ([Igor Nikonov](https://github.com/devcrafter)).
+* Add SQL functions for entropy-learned hashing. [#49656](https://github.com/ClickHouse/ClickHouse/pull/49656) ([Robert Schulze](https://github.com/rschu1ze)).
+* `clickhouse-client` now accepts queries after "--multiquery" when "--query" (or "-q") is absent. Example: `clickhouse-client --multiquery "select 1; select 2;"`. [#49870](https://github.com/ClickHouse/ClickHouse/pull/49870) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Add separate `handshake_timeout` for receiving Hello packet from replica. Closes [#48854](https://github.com/ClickHouse/ClickHouse/issues/48854). [#49948](https://github.com/ClickHouse/ClickHouse/pull/49948) ([Kruglov Pavel](https://github.com/Avogar)).
+* The new setting `s3_max_inflight_parts_for_one_file` limits the number of parts that may be uploaded concurrently within a single file's multipart upload. [#49961](https://github.com/ClickHouse/ClickHouse/pull/49961) ([Sema Checherinda](https://github.com/CheSema)).
+* Geographical data types (`Point`, `Ring`, `Polygon`, and `MultiPolygon`) are production-ready. [#50022](https://github.com/ClickHouse/ClickHouse/pull/50022) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Added a function "space()" which repeats a space as many times as specified. [#50103](https://github.com/ClickHouse/ClickHouse/pull/50103) ([Robert Schulze](https://github.com/rschu1ze)).
+* Added --input_format_csv_trim_whitespaces option. [#50215](https://github.com/ClickHouse/ClickHouse/pull/50215) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Added the dictGetAll function for regexp tree dictionaries to return values from multiple matches as arrays. Closes [#50254](https://github.com/ClickHouse/ClickHouse/issues/50254). [#50255](https://github.com/ClickHouse/ClickHouse/pull/50255) ([Johann Gan](https://github.com/johanngan)).
+* Added toLastDayOfWeek() function to round a date or a date with time up to the nearest Saturday or Sunday. [#50315](https://github.com/ClickHouse/ClickHouse/pull/50315) ([Victor Krasnov](https://github.com/sirvickr)).
+* Ability to ignore a skip index by specifying `ignore_data_skipping_indices`. [#50329](https://github.com/ClickHouse/ClickHouse/pull/50329) ([Boris Kuschel](https://github.com/bkuschel)).
+* Revert 'Add SQL functions for entropy-learned hashing'. [#50416](https://github.com/ClickHouse/ClickHouse/pull/50416) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add `system.user_processes` table and `SHOW USER PROCESSES` query to show memory info and ProfileEvents on user level. [#50492](https://github.com/ClickHouse/ClickHouse/pull/50492) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)).
+* Added storage engine `AzureBlobStorage` and `azure_blob_storage` table function. The supported set of features is very similar to storage/table function `S3`. Implements [#19307](https://github.com/ClickHouse/ClickHouse/issues/19307). [#50604](https://github.com/ClickHouse/ClickHouse/pull/50604) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+
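+A minimal sketch of the `ignore_data_skipping_indices` setting from the list above; the table, column, and index names are hypothetical, not taken from the PR:
+
+```sql
+-- A table with a skip index on `value` (hypothetical example).
+CREATE TABLE data
+(
+    key Int64,
+    value String,
+    INDEX value_idx value TYPE bloom_filter GRANULARITY 1
+)
+ENGINE = MergeTree
+ORDER BY key;
+
+-- Query as usual, but tell the planner to ignore the named skip index.
+SELECT * FROM data
+WHERE value = 'xyz'
+SETTINGS ignore_data_skipping_indices = 'value_idx';
+```
+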
+#### Performance Improvement
+* Compress marks and primary key by default. It significantly reduces the cold query time. **Upgrade notes:** support for compressed marks and primary key was added in version 22.9. If you turned on compressed marks or primary key, or installed version 23.5 or newer (which enables them by default), you will not be able to downgrade to version 22.8 or earlier. You can also explicitly disable compressed marks or primary keys by specifying the `compress_marks` and `compress_primary_key` settings in the `<merge_tree>` section of the server configuration file. If you upgrade from a version prior to 22.9, you should either upgrade all replicas at once, disable the compression before the upgrade, or upgrade through an intermediate version where the compressed marks are supported but not enabled by default, such as 23.3. [#42587](https://github.com/ClickHouse/ClickHouse/pull/42587) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* When reading from multiple files, reduce the number of parallel parsing threads per file. Resolves [#42192](https://github.com/ClickHouse/ClickHouse/issues/42192). [#46661](https://github.com/ClickHouse/ClickHouse/pull/46661) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Do not store blocks in `ANY` hash join if nothing is inserted. [#48633](https://github.com/ClickHouse/ClickHouse/pull/48633) ([vdimir](https://github.com/vdimir)).
+* Fixes aggregate combinator `-If` when JIT compiled. Closes [#48120](https://github.com/ClickHouse/ClickHouse/issues/48120). [#49083](https://github.com/ClickHouse/ClickHouse/pull/49083) ([Igor Nikonov](https://github.com/devcrafter)).
+* For reading from remote tables, use smaller tasks (instead of reading the whole part) to make task stealing work: the task size is determined by the size of the columns to read; 1 MB buffers are always used for reading from S3; and the boundaries of cache segments are aligned to 1 MB, so they have a decent size even with small tasks, which should also prevent fragmentation. [#49287](https://github.com/ClickHouse/ClickHouse/pull/49287) ([Nikita Taranov](https://github.com/nickitat)).
+* Default size of a read buffer for reading from local filesystem changed to a slightly better value. Also two new settings are introduced: `max_read_buffer_size_local_fs` and `max_read_buffer_size_remote_fs`. [#49321](https://github.com/ClickHouse/ClickHouse/pull/49321) ([Nikita Taranov](https://github.com/nickitat)).
+* Improve memory usage and speed of `SPARSE_HASHED`/`HASHED` dictionaries (e.g. `SPARSE_HASHED` now eats 2.6x less memory, and is ~2x faster). [#49380](https://github.com/ClickHouse/ClickHouse/pull/49380) ([Azat Khuzhin](https://github.com/azat)).
+* Use an aggregate projection only if it reads fewer granules than normal reading. It should help when a query hits the PK of the table but not the projection. Fixes [#49150](https://github.com/ClickHouse/ClickHouse/issues/49150). [#49417](https://github.com/ClickHouse/ClickHouse/pull/49417) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Optimize `PODArray::resize_fill()` callers. [#49459](https://github.com/ClickHouse/ClickHouse/pull/49459) ([Azat Khuzhin](https://github.com/azat)).
+* Optimize the `system.query_log` and `system.query_thread_log` tables by applying `LowCardinality` when appropriate. The queries over these tables will be faster. [#49530](https://github.com/ClickHouse/ClickHouse/pull/49530) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Better performance when reading local Parquet files (through parallel reading). [#49539](https://github.com/ClickHouse/ClickHouse/pull/49539) ([Michael Kolupaev](https://github.com/al13n321)).
+* Improve the performance of `RIGHT/FULL JOIN` by up to 2 times in certain scenarios, especially when joining a small left table with a large right table. [#49585](https://github.com/ClickHouse/ClickHouse/pull/49585) ([lgbo](https://github.com/lgbo-ustc)).
+* Improve performance of BLAKE3 by 11% by enabling LTO for Rust. [#49600](https://github.com/ClickHouse/ClickHouse/pull/49600) ([Azat Khuzhin](https://github.com/azat)).
+* Optimize the structure of the `system.opentelemetry_span_log`. Use `LowCardinality` where appropriate. Although this table is generally stupid (it is using the Map data type even for common attributes), it will be slightly better. [#49647](https://github.com/ClickHouse/ClickHouse/pull/49647) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Try to reserve hash table's size in `grace_hash` join. [#49816](https://github.com/ClickHouse/ClickHouse/pull/49816) ([lgbo](https://github.com/lgbo-ustc)).
+* As addressed in issue [#49748](https://github.com/ClickHouse/ClickHouse/issues/49748), predicates with date converters, such as **toYear, toYYYYMM**, can be rewritten as equivalent date (YYYY-MM-DD) comparisons at the AST level (see the sketch after this list). This transformation brings a performance improvement, as it avoids the expensive date converter, and the comparison between dates (or integers in the low-level representation) is quite low-cost. The [prototype](https://github.com/ZhiguoZh/ClickHouse/commit/c7f1753f0c9363a19d95fa46f1cfed1d9f505ee0) shows that, with all identified date converters optimized, the overall QPS of the 13 queries is enhanced by **~11%** on the ICX server (Intel Xeon Platinum 8380 CPU, 80 cores, 160 threads). [#50062](https://github.com/ClickHouse/ClickHouse/pull/50062) ([Zhiguo Zhou](https://github.com/ZhiguoZh)).
+* Parallel merge of `uniqExactIf` states. Closes [#49885](https://github.com/ClickHouse/ClickHouse/issues/49885). [#50285](https://github.com/ClickHouse/ClickHouse/pull/50285) ([flynn](https://github.com/ucasfl)).
+* As addressed in issue [#49748](https://github.com/ClickHouse/ClickHouse/issues/49748), predicates with date converters, such as toYear and toYYYYMM, can be rewritten as equivalent date (YYYY-MM-DD) comparisons at the AST level. This transformation brings a performance improvement, as it avoids the expensive date converter, and the comparison between dates (or integers in the low-level representation) is quite low-cost. [#50307](https://github.com/ClickHouse/ClickHouse/pull/50307) ([Zhiguo Zhou](https://github.com/ZhiguoZh)).
+* Parallel merging supported for `uniqExact` with modifiers `-Array`, `-Merge`, `-OrNull`, `-State`. [#50413](https://github.com/ClickHouse/ClickHouse/pull/50413) ([flynn](https://github.com/ucasfl)).
+* Enable LZ4_FAST_DEC_LOOP for LZ4 on Arm to gain 5% in decompression speed. [#50588](https://github.com/ClickHouse/ClickHouse/pull/50588) ([Daniel Kutenin](https://github.com/danlark1)).
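+
+A hedged illustration of the AST-level date-converter rewrite described above (`hits` and `EventDate` are hypothetical names, not taken from the PRs); the second query shows the form the optimization is assumed to produce:
+
+```sql
+-- Before the rewrite: the date converter runs as part of the predicate.
+SELECT count() FROM hits WHERE toYYYYMM(EventDate) = 202305;
+
+-- After the rewrite: a plain date-range comparison, which is much cheaper.
+SELECT count() FROM hits WHERE EventDate BETWEEN '2023-05-01' AND '2023-05-31';
+```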
+
+#### Improvement
+* Add support for cgroups v2 for asynchronous metrics about memory usage and availability. This closes [#37983](https://github.com/ClickHouse/ClickHouse/issues/37983). [#45999](https://github.com/ClickHouse/ClickHouse/pull/45999) ([sichenzhao](https://github.com/sichenzhao)).
+* Cluster table functions should always skip unavailable shards. Closes [#46314](https://github.com/ClickHouse/ClickHouse/issues/46314). [#46765](https://github.com/ClickHouse/ClickHouse/pull/46765) ([zk_kiger](https://github.com/zk-kiger)).
+* Handle empty columns in CSV files. [#47496](https://github.com/ClickHouse/ClickHouse/pull/47496) ([你不要过来啊](https://github.com/iiiuwioajdks)).
+* Support ROW POLICY for all tables that belong to a DATABASE. [#47640](https://github.com/ClickHouse/ClickHouse/pull/47640) ([Ilya Golshtein](https://github.com/ilejn)).
+* Add Google Cloud Storage S3 compatible table function `gcs`. Like the `oss` and `cosn` functions, it is just an alias over the `s3` table function, and it does not bring any new features. [#47815](https://github.com/ClickHouse/ClickHouse/pull/47815) ([Kuba Kaflik](https://github.com/jkaflik)).
+* Add ability to use strict parts size for S3 (compatibility with CloudFlare R2 S3 Storage). [#48492](https://github.com/ClickHouse/ClickHouse/pull/48492) ([Azat Khuzhin](https://github.com/azat)).
+* Added new columns with info about `Replicated` database replicas to `system.clusters`: `database_shard_name`, `database_replica_name`, `is_active`. Added an optional `FROM SHARD` clause to `SYSTEM DROP DATABASE REPLICA` query. [#48548](https://github.com/ClickHouse/ClickHouse/pull/48548) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Add a new column `zookeeper_name` to `system.replicas` to indicate on which (auxiliary) ZooKeeper cluster the replicated table's metadata is stored. [#48549](https://github.com/ClickHouse/ClickHouse/pull/48549) ([cangyin](https://github.com/cangyin)).
+* The `IN` operator now supports comparing `Date` and `Date32`. Closes [#48736](https://github.com/ClickHouse/ClickHouse/issues/48736). [#48806](https://github.com/ClickHouse/ClickHouse/pull/48806) ([flynn](https://github.com/ucasfl)).
+* Support for erasure codes in HDFS (authors: @M1eyu2018, @tomscut). [#48833](https://github.com/ClickHouse/ClickHouse/pull/48833) ([M1eyu](https://github.com/M1eyu2018)).
+* The query cache now supports queries with the totals and extremes modifiers. [#48853](https://github.com/ClickHouse/ClickHouse/pull/48853) ([Robert Schulze](https://github.com/rschu1ze)).
+* Introduce the new clause `INTO OUTFILE 'file.txt' APPEND`. [#48880](https://github.com/ClickHouse/ClickHouse/pull/48880) ([alekar](https://github.com/alekar)).
+* The `BACKUP` command will not decrypt data from encrypted disks while making a backup. Instead the data will be stored in a backup in encrypted form. Such backups can be restored only to an encrypted disk with the same (or extended) list of encryption keys. [#48896](https://github.com/ClickHouse/ClickHouse/pull/48896) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Keeper improvement: add `CheckNotExists` request to Keeper. [#48897](https://github.com/ClickHouse/ClickHouse/pull/48897) ([Antonio Andelic](https://github.com/antonio2368)).
+* Implement `SYSTEM DROP REPLICA` for auxiliary ZooKeeper clusters. May close [#48931](https://github.com/ClickHouse/ClickHouse/issues/48931). [#48932](https://github.com/ClickHouse/ClickHouse/pull/48932) ([wangxiaobo](https://github.com/wzb5212)).
+* Add support for the `Array` data type to MongoDB. Closes [#48598](https://github.com/ClickHouse/ClickHouse/issues/48598). [#48983](https://github.com/ClickHouse/ClickHouse/pull/48983) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Keeper performance improvements: avoid serializing same request twice while processing. Cache deserialization results of large requests. Controlled by new coordination setting `min_request_size_for_cache`. [#49004](https://github.com/ClickHouse/ClickHouse/pull/49004) ([Antonio Andelic](https://github.com/antonio2368)).
+* Support storing `Interval` data types in tables. [#49085](https://github.com/ClickHouse/ClickHouse/pull/49085) ([larryluogit](https://github.com/larryluogit)).
+* Add support for size suffixes in quota creation statement parameters. [#49087](https://github.com/ClickHouse/ClickHouse/pull/49087) ([Eridanus](https://github.com/Eridanus117)).
+* Allow using `ntile` window function without explicit window frame definition: `ntile(3) OVER (ORDER BY a)`, close [#46763](https://github.com/ClickHouse/ClickHouse/issues/46763). [#49093](https://github.com/ClickHouse/ClickHouse/pull/49093) ([vdimir](https://github.com/vdimir)).
+* Added settings (`number_of_mutations_to_delay`, `number_of_mutations_to_throw`) to delay or throw `ALTER` queries that create mutations (`ALTER UPDATE`, `ALTER DELETE`, `ALTER MODIFY COLUMN`, ...) when the table already has a lot of unfinished mutations. [#49117](https://github.com/ClickHouse/ClickHouse/pull/49117) ([Anton Popov](https://github.com/CurtizJ)).
+* Added setting `async_insert` for MergeTree tables. It has the same meaning as the query-level setting `async_insert` and enables asynchronous inserts for a specific table. Note: it doesn't take effect for insert queries from `clickhouse-client`; use the query-level setting in that case. [#49122](https://github.com/ClickHouse/ClickHouse/pull/49122) ([Anton Popov](https://github.com/CurtizJ)).
+* Catch exception from `create_directories` in filesystem cache. [#49203](https://github.com/ClickHouse/ClickHouse/pull/49203) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Copies embedded examples to a new field `example` in `system.functions` to supplement the field `description`. [#49222](https://github.com/ClickHouse/ClickHouse/pull/49222) ([Dan Roscigno](https://github.com/DanRoscigno)).
+* Enable connection options for the MongoDB dictionary. [#49225](https://github.com/ClickHouse/ClickHouse/pull/49225) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+* Added an alias `asymptotic` for `asymp` computational method for `kolmogorovSmirnovTest`. Improved documentation. [#49286](https://github.com/ClickHouse/ClickHouse/pull/49286) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* The aggregation functions `groupBitAnd`/`groupBitOr`/`groupBitXor` now work on signed integer data. This makes them consistent with the behavior of the scalar functions `bitAnd`/`bitOr`/`bitXor`. [#49292](https://github.com/ClickHouse/ClickHouse/pull/49292) ([exmy](https://github.com/exmy)).
+* Split function documentation into more fine-grained fields. [#49300](https://github.com/ClickHouse/ClickHouse/pull/49300) ([Robert Schulze](https://github.com/rschu1ze)).
+* Introduced settings `merge_max_block_size_bytes` (to limit the amount of memory used for background operations) and `vertical_merge_algorithm_min_bytes_to_activate` (to add another condition to activate vertical merges). [#49313](https://github.com/ClickHouse/ClickHouse/pull/49313) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Use multiple threads shared between all tables within a server to load outdated data parts. The size of the pool and its queue are controlled by the `max_outdated_parts_loading_thread_pool_size` and `outdated_part_loading_thread_pool_queue_size` settings. [#49317](https://github.com/ClickHouse/ClickHouse/pull/49317) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Don't overestimate the size of processed data for `LowCardinality` columns when they share dictionaries between blocks. This closes [#49322](https://github.com/ClickHouse/ClickHouse/issues/49322). See also [#48745](https://github.com/ClickHouse/ClickHouse/issues/48745). [#49323](https://github.com/ClickHouse/ClickHouse/pull/49323) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* The Parquet writer now uses a reasonable row group size when invoked through `INTO OUTFILE`. [#49325](https://github.com/ClickHouse/ClickHouse/pull/49325) ([Michael Kolupaev](https://github.com/al13n321)).
+* Allow restricted keywords like `ARRAY` as an alias if the alias is quoted. Closes [#49324](https://github.com/ClickHouse/ClickHouse/issues/49324). [#49360](https://github.com/ClickHouse/ClickHouse/pull/49360) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Added the possibility to use temporary tables in the FROM part of `ATTACH PARTITION FROM` and `REPLACE PARTITION FROM`. [#49436](https://github.com/ClickHouse/ClickHouse/pull/49436) ([Roman Vasin](https://github.com/rvasin)).
+* Data parts loading and deletion jobs were moved to shared server-wide pools instead of per-table pools. Pools sizes are controlled via settings `max_active_parts_loading_thread_pool_size`, `max_outdated_parts_loading_thread_pool_size` and `max_parts_cleaning_thread_pool_size` in top-level config. Table-level settings `max_part_loading_threads` and `max_part_removal_threads` became obsolete. [#49474](https://github.com/ClickHouse/ClickHouse/pull/49474) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Allow `?password=pass` in the URL. The password is replaced in the browser history. [#49505](https://github.com/ClickHouse/ClickHouse/pull/49505) ([Mike Kot](https://github.com/myrrc)).
+* Allow zero objects in ReadBufferFromRemoteFSGather (because empty files are not backed up, we might end up with zero blobs in the metadata file). Closes [#49480](https://github.com/ClickHouse/ClickHouse/issues/49480). [#49519](https://github.com/ClickHouse/ClickHouse/pull/49519) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Attach thread MemoryTracker to `total_memory_tracker` after `ThreadGroup` detached. [#49527](https://github.com/ClickHouse/ClickHouse/pull/49527) ([Dmitry Novik](https://github.com/novikd)).
+* Make `Pretty` formats prettier: squash blocks if not much time passed since the output of the previous block. This is controlled by a new setting `output_format_pretty_squash_ms` (100ms by default). This closes [#49153](https://github.com/ClickHouse/ClickHouse/issues/49153). [#49537](https://github.com/ClickHouse/ClickHouse/pull/49537) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add initial support to do JOINs with pure parallel replicas. [#49544](https://github.com/ClickHouse/ClickHouse/pull/49544) ([Raúl Marín](https://github.com/Algunenano)).
+* Fix parameterized views when a query parameter is used multiple times in the query. [#49556](https://github.com/ClickHouse/ClickHouse/pull/49556) ([Azat Khuzhin](https://github.com/azat)).
+* Release memory allocated for the last sent ProfileEvents snapshot in the context of a query. Followup [#47564](https://github.com/ClickHouse/ClickHouse/issues/47564). [#49561](https://github.com/ClickHouse/ClickHouse/pull/49561) ([Dmitry Novik](https://github.com/novikd)).
+* Function "makeDate" now provides a MySQL-compatible overload (year & day of the year argument). [#49603](https://github.com/ClickHouse/ClickHouse/pull/49603) ([Robert Schulze](https://github.com/rschu1ze)).
+* More parallelism on `Outdated` parts removal with "zero-copy replication". [#49630](https://github.com/ClickHouse/ClickHouse/pull/49630) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Reduced number of `List` ZooKeeper requests when selecting parts to merge and a lot of partitions do not have anything to merge. [#49637](https://github.com/ClickHouse/ClickHouse/pull/49637) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Support `dictionary` table function for `RegExpTreeDictionary`. [#49666](https://github.com/ClickHouse/ClickHouse/pull/49666) ([Han Fei](https://github.com/hanfei1991)).
+* Added a weighted fair IO scheduling policy. Added a dynamic resource manager, which allows the IO scheduling hierarchy to be updated at runtime without server restarts. [#49671](https://github.com/ClickHouse/ClickHouse/pull/49671) ([Sergei Trifonov](https://github.com/serxa)).
+* Add compose request after multipart upload to GCS. This enables the usage of copy operation on objects uploaded with the multipart upload. It's recommended to set `s3_strict_upload_part_size` to some value because compose request can fail on objects created with parts of different sizes. [#49693](https://github.com/ClickHouse/ClickHouse/pull/49693) ([Antonio Andelic](https://github.com/antonio2368)).
+* Improve the "best-effort" parsing logic to accept `key_value_delimiter` as a valid part of the value. This also simplifies branching and might even speed up things a bit. [#49760](https://github.com/ClickHouse/ClickHouse/pull/49760) ([Arthur Passos](https://github.com/arthurpassos)).
+* Facilitate profile data association and aggregation for the same query. [#49777](https://github.com/ClickHouse/ClickHouse/pull/49777) ([helifu](https://github.com/helifu)).
+* System log tables can now have custom sorting keys. [#49778](https://github.com/ClickHouse/ClickHouse/pull/49778) ([helifu](https://github.com/helifu)).
+* A new field 'partitions' is used to indicate which partitions are participating in the calculation. [#49779](https://github.com/ClickHouse/ClickHouse/pull/49779) ([helifu](https://github.com/helifu)).
+* Added `enable_the_endpoint_id_with_zookeeper_name_prefix` setting for `ReplicatedMergeTree` (disabled by default). When enabled, it adds ZooKeeper cluster name to table's interserver communication endpoint. It avoids `Duplicate interserver IO endpoint` errors when having replicated tables with the same path, but different auxiliary ZooKeepers. [#49780](https://github.com/ClickHouse/ClickHouse/pull/49780) ([helifu](https://github.com/helifu)).
+* Add query parameters to clickhouse-local. Closes [#46561](https://github.com/ClickHouse/ClickHouse/issues/46561). [#49785](https://github.com/ClickHouse/ClickHouse/pull/49785) ([Nikolay Degterinsky](https://github.com/evillique)).
+* The QPL_DEFLATE codec lowered the minimum SIMD requirement to SSE 4.2 ([doc change in QPL](https://github.com/intel/qpl/commit/3f8f5cea27739f5261e8fd577dc233ffe88bf679)): Intel® QPL relies on a run-time kernel dispatcher and a CPUID check to choose the best available implementation (SSE/AVX2/AVX512). Also restructured the CMake file for the QPL build in ClickHouse to align with the latest upstream QPL. [#49811](https://github.com/ClickHouse/ClickHouse/pull/49811) ([jasperzhu](https://github.com/jinjunzh)).
+* Allow loading dictionaries and functions from YAML by default. In previous versions, it required editing the `dictionaries_config` or `user_defined_executable_functions_config` in the configuration file, as they expected `*.xml` files. [#49812](https://github.com/ClickHouse/ClickHouse/pull/49812) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* The Kafka table engine now allows using alias columns. [#49824](https://github.com/ClickHouse/ClickHouse/pull/49824) ([Aleksandr Musorin](https://github.com/AVMusorin)).
+* Add a setting to limit the maximum number of pairs produced by `extractKeyValuePairs`, as a safeguard against using way too much memory. [#49836](https://github.com/ClickHouse/ClickHouse/pull/49836) ([Arthur Passos](https://github.com/arthurpassos)).
+* Add support for (an unusual) case where the arguments in the `IN` operator are single-element tuples. [#49844](https://github.com/ClickHouse/ClickHouse/pull/49844) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+* The `bitHammingDistance` function now supports the `String` and `FixedString` data types. Closes [#48827](https://github.com/ClickHouse/ClickHouse/issues/48827). [#49858](https://github.com/ClickHouse/ClickHouse/pull/49858) ([flynn](https://github.com/ucasfl)).
+* Fix timeout resetting errors in the client on OS X. [#49863](https://github.com/ClickHouse/ClickHouse/pull/49863) ([alekar](https://github.com/alekar)).
+* Add support for big integers, such as UInt128, Int128, UInt256, and Int256 in the function `bitCount`. This enables Hamming distance over large bit masks for AI applications. [#49867](https://github.com/ClickHouse/ClickHouse/pull/49867) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Use fingerprints instead of key IDs in encrypted disks. [#49882](https://github.com/ClickHouse/ClickHouse/pull/49882) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Add support for the UUID data type to PostgreSQL. Closes [#49739](https://github.com/ClickHouse/ClickHouse/issues/49739). [#49894](https://github.com/ClickHouse/ClickHouse/pull/49894) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Mark the `allow_experimental_query_cache` setting as obsolete for backward compatibility. It was removed in https://github.com/ClickHouse/ClickHouse/pull/47977. [#49934](https://github.com/ClickHouse/ClickHouse/pull/49934) ([Timur Solodovnikov](https://github.com/tsolodov)).
+* Function `toUnixTimestamp()` now accepts `Date` and `Date32` arguments. [#49989](https://github.com/ClickHouse/ClickHouse/pull/49989) ([Victor Krasnov](https://github.com/sirvickr)).
+* Charge only server memory for dictionaries. [#49995](https://github.com/ClickHouse/ClickHouse/pull/49995) ([Azat Khuzhin](https://github.com/azat)).
+* Add schema inference to PostgreSQL, MySQL, MeiliSearch, and SQLite table engines. Closes [#49972](https://github.com/ClickHouse/ClickHouse/issues/49972). [#50000](https://github.com/ClickHouse/ClickHouse/pull/50000) ([Nikolay Degterinsky](https://github.com/evillique)).
+* The server will allow using the `SQL_*` settings such as `SQL_AUTO_IS_NULL` as no-ops for MySQL compatibility. This closes [#49927](https://github.com/ClickHouse/ClickHouse/issues/49927). [#50013](https://github.com/ClickHouse/ClickHouse/pull/50013) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Preserve initial_query_id for ON CLUSTER queries, which is useful for introspection (under `distributed_ddl_entry_format_version=5`). [#50015](https://github.com/ClickHouse/ClickHouse/pull/50015) ([Azat Khuzhin](https://github.com/azat)).
+* Preserve backward compatibility for renamed settings by using aliases (`allow_experimental_projection_optimization` for `optimize_use_projections`, `allow_experimental_lightweight_delete` for `enable_lightweight_delete`). [#50044](https://github.com/ClickHouse/ClickHouse/pull/50044) ([Azat Khuzhin](https://github.com/azat)).
+* Support cross-replication in distributed queries using the new infrastructure. [#50097](https://github.com/ClickHouse/ClickHouse/pull/50097) ([Dmitry Novik](https://github.com/novikd)).
+* Support passing the FQDN through the setting `my_hostname` to register a cluster node in Keeper. Add an `invisible` setting to support multiple compute groups; a compute group, as a cluster, is invisible to other compute groups. [#50186](https://github.com/ClickHouse/ClickHouse/pull/50186) ([Yangkuan Liu](https://github.com/LiuYangkuan)).
+* Fix PostgreSQL reading all the data even though `LIMIT n` could be specified. [#50187](https://github.com/ClickHouse/ClickHouse/pull/50187) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* 1) Fixed an error `NOT_FOUND_COLUMN_IN_BLOCK` when using parallel replicas with non-replicated storage and the setting `parallel_replicas_for_non_replicated_merge_tree` disabled. 2) Now `allow_experimental_parallel_reading_from_replicas` has 3 possible values: 0 - disabled; 1 - enabled, but silently disable parallel replicas in case of failure (such as FINAL or JOIN); 2 - enabled, throw an exception in case of failure. 3) If the FINAL modifier is used in a SELECT query and parallel replicas are enabled, ClickHouse will try to disable them if `allow_experimental_parallel_reading_from_replicas` is set to 1, and throw an exception otherwise. [#50195](https://github.com/ClickHouse/ClickHouse/pull/50195) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Don't send a HEAD request for all keys in Iceberg schema inference, only for keys that are used for reading data. [#50203](https://github.com/ClickHouse/ClickHouse/pull/50203) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add new profile events for queries with subqueries (`QueriesWithSubqueries`/`SelectQueriesWithSubqueries`/`InsertQueriesWithSubqueries`). [#50204](https://github.com/ClickHouse/ClickHouse/pull/50204) ([Azat Khuzhin](https://github.com/azat)).
+* Added the `roles` field in the users.xml file, which allows specifying roles with grants via a config file. [#50278](https://github.com/ClickHouse/ClickHouse/pull/50278) ([pufit](https://github.com/pufit)).
+* When parallel replicas are enabled they will always skip unavailable servers (the behavior is controlled by the setting `skip_unavailable_shards`, enabled by default and can be only disabled). This closes: [#48565](https://github.com/ClickHouse/ClickHouse/issues/48565). [#50293](https://github.com/ClickHouse/ClickHouse/pull/50293) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Fix a typo. [#50306](https://github.com/ClickHouse/ClickHouse/pull/50306) ([helifu](https://github.com/helifu)).
+* Setting `enable_memory_bound_merging_of_aggregation_results` is enabled by default. If you update from a version prior to 22.12, we recommend setting this flag to `false` until the update is finished. [#50319](https://github.com/ClickHouse/ClickHouse/pull/50319) ([Nikita Taranov](https://github.com/nickitat)).
+* Report `CGroupCpuCfsPeriod` and `CGroupCpuCfsQuota` in AsynchronousMetrics. - Respect cgroup v2 memory limits during server startup. [#50379](https://github.com/ClickHouse/ClickHouse/pull/50379) ([alekar](https://github.com/alekar)).
+* Bump internal protobuf to v3.18 (fixes CVE-2022-1941). [#50400](https://github.com/ClickHouse/ClickHouse/pull/50400) ([Robert Schulze](https://github.com/rschu1ze)).
+* Bump internal libxml2 to v2.10.4 (fixes CVE-2023-28484 and CVE-2023-29469). [#50402](https://github.com/ClickHouse/ClickHouse/pull/50402) ([Robert Schulze](https://github.com/rschu1ze)).
+* Bump c-ares to v1.19.1 (CVE-2023-32067, CVE-2023-31130, CVE-2023-31147). [#50403](https://github.com/ClickHouse/ClickHouse/pull/50403) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix CVE-2022-2469 in libgsasl. [#50404](https://github.com/ClickHouse/ClickHouse/pull/50404) ([Robert Schulze](https://github.com/rschu1ze)).
+* Allow filter push-down through cross join. [#50430](https://github.com/ClickHouse/ClickHouse/pull/50430) ([Han Fei](https://github.com/hanfei1991)).
+* Add a signal handler for SIGQUIT to work the same way as SIGINT. Closes [#50298](https://github.com/ClickHouse/ClickHouse/issues/50298). [#50435](https://github.com/ClickHouse/ClickHouse/pull/50435) ([Nikolay Degterinsky](https://github.com/evillique)).
+* If JSON parsing fails due to the large size of the object, output the last position to allow debugging. [#50474](https://github.com/ClickHouse/ClickHouse/pull/50474) ([Valentin Alexeev](https://github.com/valentinalexeev)).
+* Support decimals with non-fixed size. Closes [#49130](https://github.com/ClickHouse/ClickHouse/issues/49130). [#50586](https://github.com/ClickHouse/ClickHouse/pull/50586) ([Kruglov Pavel](https://github.com/Avogar)).
+* Disable pure parallel replicas if trivial count optimization is possible. [#50594](https://github.com/ClickHouse/ClickHouse/pull/50594) ([Raúl Marín](https://github.com/Algunenano)).
+* Added support for `TRUNCATE db.table` in addition to `TRUNCATE TABLE db.table` in MaterializedMySQL. [#50624](https://github.com/ClickHouse/ClickHouse/pull/50624) ([Val Doroshchuk](https://github.com/valbok)).
+* Disable parallel replicas automatically when the estimated number of granules is less than the threshold. The behavior is controlled by the setting `parallel_replicas_min_number_of_granules_to_enable`. [#50639](https://github.com/ClickHouse/ClickHouse/pull/50639) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* When creating skipping indexes via `ALTER TABLE table ADD INDEX`, the `GRANULARITY` clause can now be omitted; in that case, `GRANULARITY` is assumed to be 1 (see the sketch after this list). [#50658](https://github.com/ClickHouse/ClickHouse/pull/50658) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix slow cache in presence of big inserts. [#50680](https://github.com/ClickHouse/ClickHouse/pull/50680) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Set the default `max_elements` limit in the filesystem cache to 10000000. [#50682](https://github.com/ClickHouse/ClickHouse/pull/50682) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* `SHOW INDICES` is now an alias of the statement `SHOW INDEX`/`INDEXES`/`KEYS`. [#50713](https://github.com/ClickHouse/ClickHouse/pull/50713) ([Robert Schulze](https://github.com/rschu1ze)).
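+
+A minimal sketch of the now-optional `GRANULARITY` clause mentioned above; the table, column, and index names are hypothetical:
+
+```sql
+-- GRANULARITY may now be omitted when adding a skipping index ...
+ALTER TABLE events ADD INDEX value_minmax value TYPE minmax;
+
+-- ... which is equivalent to spelling out the default explicitly:
+-- ALTER TABLE events ADD INDEX value_minmax value TYPE minmax GRANULARITY 1;
+```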
+
+#### Build/Testing/Packaging Improvement
+* New and improved keeper-bench. Everything can be customized from a YAML/XML file: request generators, where each type of request generator has a specific set of fields; multi-requests, generated by nesting the same definitions under a `multi` key, with an optional `weight` field per request or subrequest to control the distribution; trees that need to be set up for a test run; and hosts, with all timeouts customizable and control over how many sessions to generate for each host. Integers defined with `min_value` and `max_value` fields are random number generators. [#48547](https://github.com/ClickHouse/ClickHouse/pull/48547) ([Antonio Andelic](https://github.com/antonio2368)).
+* Add a test to check `max_rows_to_read_leaf` behaviour. [#48950](https://github.com/ClickHouse/ClickHouse/pull/48950) ([Sean Haynes](https://github.com/seandhaynes)).
+* io_uring is not supported on macOS; don't choose it when running tests locally, to avoid occasional failures. [#49250](https://github.com/ClickHouse/ClickHouse/pull/49250) ([Frank Chen](https://github.com/FrankChen021)).
+* Support named fault injection for testing. [#49361](https://github.com/ClickHouse/ClickHouse/pull/49361) ([Han Fei](https://github.com/hanfei1991)).
+* Fix the 01193_metadata_loading test to match the query execution time specific to s390x. [#49455](https://github.com/ClickHouse/ClickHouse/pull/49455) ([MeenaRenganathan22](https://github.com/MeenaRenganathan22)).
+* Use the RapidJSONParser library to parse the JSON float values in case of s390x. [#49457](https://github.com/ClickHouse/ClickHouse/pull/49457) ([MeenaRenganathan22](https://github.com/MeenaRenganathan22)).
+* Allow running ClickHouse in an OS where the `prctl` (process control) syscall is not available, such as AWS Lambda. [#49538](https://github.com/ClickHouse/ClickHouse/pull/49538) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Improve CI check with an enabled analyzer. Now it should be green if only tests from `tests/broken_tests.txt` are broken. [#49562](https://github.com/ClickHouse/ClickHouse/pull/49562) ([Dmitry Novik](https://github.com/novikd)).
+* Fixed a build conflict between contrib/isa-l and the isa-l bundled in QPL [#49296](https://github.com/ClickHouse/ClickHouse/issues/49296). [#49584](https://github.com/ClickHouse/ClickHouse/pull/49584) ([jasperzhu](https://github.com/jinjunzh)).
+* Utilities are now only built if explicitly requested (`-DENABLE_UTILS=1`) instead of by default; this reduces link times in typical development builds. [#49620](https://github.com/ClickHouse/ClickHouse/pull/49620) ([Robert Schulze](https://github.com/rschu1ze)).
+* Pull build description of idxd-config into a separate CMake file to avoid accidental removal in future. [#49651](https://github.com/ClickHouse/ClickHouse/pull/49651) ([jasperzhu](https://github.com/jinjunzh)).
+* Add CI check with an enabled analyzer in the master. Followup [#49562](https://github.com/ClickHouse/ClickHouse/issues/49562). [#49668](https://github.com/ClickHouse/ClickHouse/pull/49668) ([Dmitry Novik](https://github.com/novikd)).
+* Switch to LLVM/clang 16. [#49678](https://github.com/ClickHouse/ClickHouse/pull/49678) ([Azat Khuzhin](https://github.com/azat)).
+* Fixed DefaultHash64 for non-64 bit integers on s390x. [#49833](https://github.com/ClickHouse/ClickHouse/pull/49833) ([Harry Lee](https://github.com/HarryLeeIBM)).
+* Allow building ClickHouse with clang-17. [#49851](https://github.com/ClickHouse/ClickHouse/pull/49851) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* ClickHouse is now easier to integrate into other CMake projects. [#49991](https://github.com/ClickHouse/ClickHouse/pull/49991) ([Amos Bird](https://github.com/amosbird)).
+* Link `boost::context` library to `clickhouse_common_io`. This closes: [#50381](https://github.com/ClickHouse/ClickHouse/issues/50381). [#50385](https://github.com/ClickHouse/ClickHouse/pull/50385) ([HaiBo Li](https://github.com/marising)).
+* Add support for building with clang-17. [#50410](https://github.com/ClickHouse/ClickHouse/pull/50410) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix strange additional QEMU logging after [#47151](https://github.com/ClickHouse/ClickHouse/issues/47151), see https://s3.amazonaws.com/clickhouse-test-reports/50078/a4743996ee4f3583884d07bcd6501df0cfdaa346/stateless_tests__release__databasereplicated__[3_4].html. [#50442](https://github.com/ClickHouse/ClickHouse/pull/50442) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* ClickHouse can work on Linux RISC-V 6.1.22. This closes [#50456](https://github.com/ClickHouse/ClickHouse/issues/50456). [#50457](https://github.com/ClickHouse/ClickHouse/pull/50457) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* ActionsDAG: fix wrong optimization [#47584](https://github.com/ClickHouse/ClickHouse/pull/47584) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* Correctly handle concurrent snapshots in Keeper [#48466](https://github.com/ClickHouse/ClickHouse/pull/48466) ([Antonio Andelic](https://github.com/antonio2368)).
+* MergeTreeMarksLoader holds DataPart instead of DataPartStorage [#48515](https://github.com/ClickHouse/ClickHouse/pull/48515) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix sequence state [#48603](https://github.com/ClickHouse/ClickHouse/pull/48603) ([Ilya Golshtein](https://github.com/ilejn)).
+* Backup/Restore concurrency check on previous failures [#48726](https://github.com/ClickHouse/ClickHouse/pull/48726) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix: attaching a table with a non-existent ZK path does not increase the ReadonlyReplica metric [#48954](https://github.com/ClickHouse/ClickHouse/pull/48954) ([wangxiaobo](https://github.com/wzb5212)).
+* Fix possible terminate called for uncaught exception in some places [#49112](https://github.com/ClickHouse/ClickHouse/pull/49112) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix key not found error for queries with multiple StorageJoin [#49137](https://github.com/ClickHouse/ClickHouse/pull/49137) ([vdimir](https://github.com/vdimir)).
+* Fix wrong query result when using nullable primary key [#49172](https://github.com/ClickHouse/ClickHouse/pull/49172) ([Duc Canh Le](https://github.com/canhld94)).
+* Revert "Fix GCS native copy ([#48981](https://github.com/ClickHouse/ClickHouse/issues/48981))" [#49194](https://github.com/ClickHouse/ClickHouse/pull/49194) ([Raúl Marín](https://github.com/Algunenano)).
+* Fix reinterpretAs*() on big endian machines [#49198](https://github.com/ClickHouse/ClickHouse/pull/49198) ([Suzy Wang](https://github.com/SuzyWangIBMer)).
+* Lock zero copy parts more atomically [#49211](https://github.com/ClickHouse/ClickHouse/pull/49211) ([alesapin](https://github.com/alesapin)).
+* Fix race on Outdated parts loading [#49223](https://github.com/ClickHouse/ClickHouse/pull/49223) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix wrong answer when all key values are NULL and GROUP BY uses ROLLUP [#49282](https://github.com/ClickHouse/ClickHouse/pull/49282) ([Shuai li](https://github.com/loneylee)).
+* Fix calculating load_factor for HASHED dictionaries with SHARDS [#49319](https://github.com/ClickHouse/ClickHouse/pull/49319) ([Azat Khuzhin](https://github.com/azat)).
+* Disallow configuring compression CODECs for alias columns [#49363](https://github.com/ClickHouse/ClickHouse/pull/49363) ([Timur Solodovnikov](https://github.com/tsolodov)).
+* Fix bug in removal of existing part directory [#49365](https://github.com/ClickHouse/ClickHouse/pull/49365) ([alesapin](https://github.com/alesapin)).
+* Properly fix GCS when HMAC is used [#49390](https://github.com/ClickHouse/ClickHouse/pull/49390) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix fuzz bug when subquery set is not built when reading from remote() [#49425](https://github.com/ClickHouse/ClickHouse/pull/49425) ([Alexander Gololobov](https://github.com/davenger)).
+* Invert `shutdown_wait_unfinished_queries` [#49427](https://github.com/ClickHouse/ClickHouse/pull/49427) ([Konstantin Bogdanov](https://github.com/thevar1able)).
+* Fix another zero copy bug [#49473](https://github.com/ClickHouse/ClickHouse/pull/49473) ([alesapin](https://github.com/alesapin)).
+* Fix postgres database setting [#49481](https://github.com/ClickHouse/ClickHouse/pull/49481) ([Mal Curtis](https://github.com/snikch)).
+* Correctly handle s3Cluster arguments [#49490](https://github.com/ClickHouse/ClickHouse/pull/49490) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix bug in TraceCollector destructor. [#49508](https://github.com/ClickHouse/ClickHouse/pull/49508) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix AsynchronousReadIndirectBufferFromRemoteFS breaking on short seeks [#49525](https://github.com/ClickHouse/ClickHouse/pull/49525) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix dictionaries loading order [#49560](https://github.com/ClickHouse/ClickHouse/pull/49560) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Forbid the change of data type of Object('json') column [#49563](https://github.com/ClickHouse/ClickHouse/pull/49563) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Fix stress test (Logical error: Expected 7134 >= 11030) [#49623](https://github.com/ClickHouse/ClickHouse/pull/49623) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix bug in DISTINCT [#49628](https://github.com/ClickHouse/ClickHouse/pull/49628) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix: DISTINCT in order with zero values in non-sorted columns [#49636](https://github.com/ClickHouse/ClickHouse/pull/49636) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix off-by-one error in big integers found by UBSan with fuzzer [#49645](https://github.com/ClickHouse/ClickHouse/pull/49645) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix reading from sparse columns after restart [#49660](https://github.com/ClickHouse/ClickHouse/pull/49660) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix assert in SpanHolder::finish() with fibers [#49673](https://github.com/ClickHouse/ClickHouse/pull/49673) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix short circuit functions and mutations with sparse arguments [#49716](https://github.com/ClickHouse/ClickHouse/pull/49716) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix writing appended files to incremental backups [#49725](https://github.com/ClickHouse/ClickHouse/pull/49725) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Ignore LWD column in checkPartDynamicColumns [#49737](https://github.com/ClickHouse/ClickHouse/pull/49737) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix msan issue in randomStringUTF8() [#49750](https://github.com/ClickHouse/ClickHouse/pull/49750) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix aggregate function kolmogorovSmirnovTest [#49768](https://github.com/ClickHouse/ClickHouse/pull/49768) ([FFFFFFFHHHHHHH](https://github.com/FFFFFFFHHHHHHH)).
+* Fix settings aliases in native protocol [#49776](https://github.com/ClickHouse/ClickHouse/pull/49776) ([Azat Khuzhin](https://github.com/azat)).
+* Fix `arrayMap` with array of tuples with single argument [#49789](https://github.com/ClickHouse/ClickHouse/pull/49789) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix per-query IO/BACKUPs throttling settings [#49797](https://github.com/ClickHouse/ClickHouse/pull/49797) ([Azat Khuzhin](https://github.com/azat)).
+* Fix setting NULL in profile definition [#49831](https://github.com/ClickHouse/ClickHouse/pull/49831) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix a bug with projections and the aggregate_functions_null_for_empty setting (for query_plan_optimize_projection) [#49873](https://github.com/ClickHouse/ClickHouse/pull/49873) ([Amos Bird](https://github.com/amosbird)).
+* Fix processing pending batch for Distributed async INSERT after restart [#49884](https://github.com/ClickHouse/ClickHouse/pull/49884) ([Azat Khuzhin](https://github.com/azat)).
+* Fix assertion in CacheMetadata::doCleanup [#49914](https://github.com/ClickHouse/ClickHouse/pull/49914) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix `is_prefix` in OptimizeRegularExpression [#49919](https://github.com/ClickHouse/ClickHouse/pull/49919) ([Han Fei](https://github.com/hanfei1991)).
+* Fix metrics `WriteBufferFromS3Bytes`, `WriteBufferFromS3Microseconds` and `WriteBufferFromS3RequestsErrors` [#49930](https://github.com/ClickHouse/ClickHouse/pull/49930) ([Aleksandr Musorin](https://github.com/AVMusorin)).
+* Fix IPv6 encoding in protobuf [#49933](https://github.com/ClickHouse/ClickHouse/pull/49933) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix possible Logical error on bad Nullable parsing for text formats [#49960](https://github.com/ClickHouse/ClickHouse/pull/49960) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add setting output_format_parquet_compliant_nested_types to produce more compatible Parquet files [#50001](https://github.com/ClickHouse/ClickHouse/pull/50001) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix logical error in stress test "Not enough space to add ..." [#50021](https://github.com/ClickHouse/ClickHouse/pull/50021) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Avoid deadlock when starting table in attach thread of `ReplicatedMergeTree` [#50026](https://github.com/ClickHouse/ClickHouse/pull/50026) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix assert in SpanHolder::finish() with fibers attempt 2 [#50034](https://github.com/ClickHouse/ClickHouse/pull/50034) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add proper escaping for DDL OpenTelemetry context serialization [#50045](https://github.com/ClickHouse/ClickHouse/pull/50045) ([Azat Khuzhin](https://github.com/azat)).
+* Fix reporting broken projection parts [#50052](https://github.com/ClickHouse/ClickHouse/pull/50052) ([Amos Bird](https://github.com/amosbird)).
+* Fix JIT compilation of not-equals comparisons with NaN [#50056](https://github.com/ClickHouse/ClickHouse/pull/50056) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix crashing in case of Replicated database without arguments [#50058](https://github.com/ClickHouse/ClickHouse/pull/50058) ([Azat Khuzhin](https://github.com/azat)).
+* Fix crash with `multiIf` and constant condition and nullable arguments [#50123](https://github.com/ClickHouse/ClickHouse/pull/50123) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix invalid index analysis for date related keys [#50153](https://github.com/ClickHouse/ClickHouse/pull/50153) ([Amos Bird](https://github.com/amosbird)).
+* Do not allow modifying ORDER BY when there are no ORDER BY columns [#50154](https://github.com/ClickHouse/ClickHouse/pull/50154) ([Han Fei](https://github.com/hanfei1991)).
+* Fix broken index analysis when binary operator contains a null constant argument [#50177](https://github.com/ClickHouse/ClickHouse/pull/50177) ([Amos Bird](https://github.com/amosbird)).
+* clickhouse-client: disallow usage of `--query` and `--queries-file` at the same time [#50210](https://github.com/ClickHouse/ClickHouse/pull/50210) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Fix UB for INTO OUTFILE extensions (APPEND / AND STDOUT) and WATCH EVENTS [#50216](https://github.com/ClickHouse/ClickHouse/pull/50216) ([Azat Khuzhin](https://github.com/azat)).
+* Fix skipping spaces at end of row in CustomSeparatedIgnoreSpaces format [#50224](https://github.com/ClickHouse/ClickHouse/pull/50224) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix iceberg metadata parsing [#50232](https://github.com/ClickHouse/ClickHouse/pull/50232) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix nested distributed SELECT in WITH clause [#50234](https://github.com/ClickHouse/ClickHouse/pull/50234) ([Azat Khuzhin](https://github.com/azat)).
+* Fix reconnecting of HTTPS session when target host IP was changed [#50240](https://github.com/ClickHouse/ClickHouse/pull/50240) ([Aleksei Filatov](https://github.com/aalexfvk)).
+* Fix msan issue in keyed siphash [#50245](https://github.com/ClickHouse/ClickHouse/pull/50245) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix bugs in Poco sockets in non-blocking mode, use true non-blocking sockets [#50252](https://github.com/ClickHouse/ClickHouse/pull/50252) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix checksum calculation for backup entries [#50264](https://github.com/ClickHouse/ClickHouse/pull/50264) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fixed type conversion from Date/Date32 to DateTime64 when querying with DateTime64 index [#50280](https://github.com/ClickHouse/ClickHouse/pull/50280) ([Lucas Chang](https://github.com/lucas-tubi)).
+* Comparison functions NaN fix [#50287](https://github.com/ClickHouse/ClickHouse/pull/50287) ([Maksim Kita](https://github.com/kitaisreal)).
+* JIT aggregation nullable key fix [#50291](https://github.com/ClickHouse/ClickHouse/pull/50291) ([Maksim Kita](https://github.com/kitaisreal)).
+* Fix clickhouse-local crashing when writing empty Arrow or Parquet output [#50328](https://github.com/ClickHouse/ClickHouse/pull/50328) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix crash when Pool::Entry::disconnect() is called [#50334](https://github.com/ClickHouse/ClickHouse/pull/50334) ([Val Doroshchuk](https://github.com/valbok)).
+* Improved fetch part by holding directory lock longer [#50339](https://github.com/ClickHouse/ClickHouse/pull/50339) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix bitShift* functions with both constant arguments [#50343](https://github.com/ClickHouse/ClickHouse/pull/50343) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix Keeper deadlock on exception when preprocessing requests. [#50387](https://github.com/ClickHouse/ClickHouse/pull/50387) ([frinkr](https://github.com/frinkr)).
+* Fix hashing of const integer values [#50421](https://github.com/ClickHouse/ClickHouse/pull/50421) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix excessive memory usage for FINAL (due to too much streams usage) [#50429](https://github.com/ClickHouse/ClickHouse/pull/50429) ([Azat Khuzhin](https://github.com/azat)).
+* Fix merge_tree_min_rows_for_seek/merge_tree_min_bytes_for_seek for data skipping indexes [#50432](https://github.com/ClickHouse/ClickHouse/pull/50432) ([Azat Khuzhin](https://github.com/azat)).
+* Limit the number of in-flight tasks for loading outdated parts [#50450](https://github.com/ClickHouse/ClickHouse/pull/50450) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Keeper fix: apply uncommitted state after snapshot install [#50483](https://github.com/ClickHouse/ClickHouse/pull/50483) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix incorrect constant folding [#50536](https://github.com/ClickHouse/ClickHouse/pull/50536) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix logical error in stress test (Not enough space to add ...) [#50583](https://github.com/ClickHouse/ClickHouse/pull/50583) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix converting Null to LowCardinality(Nullable) in values table function [#50637](https://github.com/ClickHouse/ClickHouse/pull/50637) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix crash in anti/semi join [#50638](https://github.com/ClickHouse/ClickHouse/pull/50638) ([vdimir](https://github.com/vdimir)).
+* Revert invalid RegExpTreeDictionary optimization [#50642](https://github.com/ClickHouse/ClickHouse/pull/50642) ([Johann Gan](https://github.com/johanngan)).
+* Correctly disable async insert with deduplication when it's not needed [#50663](https://github.com/ClickHouse/ClickHouse/pull/50663) ([Antonio Andelic](https://github.com/antonio2368)).
+
+#### Build Improvement
+
+* Fixed Functional Test 00870_t64_codec, 00871_t64_codec_signed, 00872_t64_bit_codec. [#49658](https://github.com/ClickHouse/ClickHouse/pull/49658) ([Sanjam Panda](https://github.com/saitama951)).
+
+#### NO CL ENTRY
+
+* NO CL ENTRY: 'Fix user MemoryTracker counter in async inserts'. [#47630](https://github.com/ClickHouse/ClickHouse/pull/47630) ([Dmitry Novik](https://github.com/novikd)).
+* NO CL ENTRY: 'Revert "Make `Pretty` formats even prettier."'. [#49850](https://github.com/ClickHouse/ClickHouse/pull/49850) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* NO CL ENTRY: 'Update first_value.md:remove redundant 's''. [#50331](https://github.com/ClickHouse/ClickHouse/pull/50331) ([sslouis](https://github.com/savezed)).
+* NO CL ENTRY: 'Revert "less logs in WriteBufferFromS3"'. [#50390](https://github.com/ClickHouse/ClickHouse/pull/50390) ([Alexander Tokmakov](https://github.com/tavplubix)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Attempt to fix the "system.stack_trace" test [#44627](https://github.com/ClickHouse/ClickHouse/pull/44627) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Rework WriteBufferFromS3, add tests, add abort support [#44869](https://github.com/ClickHouse/ClickHouse/pull/44869) ([Sema Checherinda](https://github.com/CheSema)).
+* Rework locking in fs cache [#44985](https://github.com/ClickHouse/ClickHouse/pull/44985) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update ubuntu_ami_for_ci.sh [#47151](https://github.com/ClickHouse/ClickHouse/pull/47151) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Implement status comment [#48468](https://github.com/ClickHouse/ClickHouse/pull/48468) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update curl to 8.0.1 (for CVEs) [#48765](https://github.com/ClickHouse/ClickHouse/pull/48765) ([Boris Kuschel](https://github.com/bkuschel)).
+* Fix some tests [#48792](https://github.com/ClickHouse/ClickHouse/pull/48792) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Bug Fix for 02432_s3_parallel_parts_cleanup.sql with zero copy replication [#48865](https://github.com/ClickHouse/ClickHouse/pull/48865) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Add AsyncLoader with dependency tracking and runtime prioritization [#48923](https://github.com/ClickHouse/ClickHouse/pull/48923) ([Sergei Trifonov](https://github.com/serxa)).
+* Fix incorrect createColumn call on join clause [#48998](https://github.com/ClickHouse/ClickHouse/pull/48998) ([Ongkong](https://github.com/ongkong)).
+* Try fix flaky 01346_alter_enum_partition_key_replicated_zookeeper_long [#49099](https://github.com/ClickHouse/ClickHouse/pull/49099) ([Sergei Trifonov](https://github.com/serxa)).
+* Fix possible logical error "Cannot cancel. Either no query sent or already cancelled" [#49106](https://github.com/ClickHouse/ClickHouse/pull/49106) ([Kruglov Pavel](https://github.com/Avogar)).
+* Refactor ColumnLowCardinality::cutAndCompact [#49111](https://github.com/ClickHouse/ClickHouse/pull/49111) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix tests with enabled analyzer [#49116](https://github.com/ClickHouse/ClickHouse/pull/49116) ([Dmitry Novik](https://github.com/novikd)).
+* Use `SharedMutex` instead of `UpgradableMutex` [#49139](https://github.com/ClickHouse/ClickHouse/pull/49139) ([Sergei Trifonov](https://github.com/serxa)).
+* Don't add metadata_version file if it doesn't exist [#49146](https://github.com/ClickHouse/ClickHouse/pull/49146) ([alesapin](https://github.com/alesapin)).
+* Clearing S3 between tests in a robust way [#49157](https://github.com/ClickHouse/ClickHouse/pull/49157) ([Sema Checherinda](https://github.com/CheSema)).
+* Align connect timeout with aws sdk default [#49161](https://github.com/ClickHouse/ClickHouse/pull/49161) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix test_encrypted_disk_replication [#49193](https://github.com/ClickHouse/ClickHouse/pull/49193) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Allow using function `concat` with `Map` type [#49200](https://github.com/ClickHouse/ClickHouse/pull/49200) ([Anton Popov](https://github.com/CurtizJ)).
+* Slight improvements to coordinator logging [#49204](https://github.com/ClickHouse/ClickHouse/pull/49204) ([Raúl Marín](https://github.com/Algunenano)).
+* Fix some typos in conversion functions [#49221](https://github.com/ClickHouse/ClickHouse/pull/49221) ([Raúl Marín](https://github.com/Algunenano)).
+* CMake: Remove some GCC-specific code [#49224](https://github.com/ClickHouse/ClickHouse/pull/49224) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix oss-fuzz build errors [#49236](https://github.com/ClickHouse/ClickHouse/pull/49236) ([Nikita Taranov](https://github.com/nickitat)).
+* Update version after release [#49237](https://github.com/ClickHouse/ClickHouse/pull/49237) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Update version_date.tsv and changelogs after v23.4.1.1943-stable [#49239](https://github.com/ClickHouse/ClickHouse/pull/49239) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Merge [#24050](https://github.com/ClickHouse/ClickHouse/issues/24050) [#49240](https://github.com/ClickHouse/ClickHouse/pull/49240) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add file name to exception raised during decompression [#49241](https://github.com/ClickHouse/ClickHouse/pull/49241) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Disable ISA-L on aarch64 architectures [#49256](https://github.com/ClickHouse/ClickHouse/pull/49256) ([Jordi Villar](https://github.com/jrdi)).
+* Add a comment in FileCache.cpp [#49260](https://github.com/ClickHouse/ClickHouse/pull/49260) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix garbage [#48719](https://github.com/ClickHouse/ClickHouse/issues/48719) [#49263](https://github.com/ClickHouse/ClickHouse/pull/49263) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Update build for nasm [#49288](https://github.com/ClickHouse/ClickHouse/pull/49288) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix race in `waitForProcessingQueue` [#49302](https://github.com/ClickHouse/ClickHouse/pull/49302) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix stress test [#49309](https://github.com/ClickHouse/ClickHouse/pull/49309) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix 02516_join_with_totals_and_subquery_bug with new analyzer [#49310](https://github.com/ClickHouse/ClickHouse/pull/49310) ([Dmitry Novik](https://github.com/novikd)).
+* Fallback auth gh api [#49314](https://github.com/ClickHouse/ClickHouse/pull/49314) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Unpoison stack frame ptrs from libunwind for msan [#49316](https://github.com/ClickHouse/ClickHouse/pull/49316) ([Robert Schulze](https://github.com/rschu1ze)).
+* Respect projections in 01600_parts [#49318](https://github.com/ClickHouse/ClickHouse/pull/49318) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Move pipe computation into initializePipeline [#49326](https://github.com/ClickHouse/ClickHouse/pull/49326) ([Konstantin Morozov](https://github.com/k-morozov)).
+* Fix compiling average example (suppress -Wframe-larger-than) [#49358](https://github.com/ClickHouse/ClickHouse/pull/49358) ([Azat Khuzhin](https://github.com/azat)).
+* Fix join_use_nulls in analyzer [#49359](https://github.com/ClickHouse/ClickHouse/pull/49359) ([vdimir](https://github.com/vdimir)).
+* Fix 02680_mysql_ast_logical_err in analyzer [#49362](https://github.com/ClickHouse/ClickHouse/pull/49362) ([vdimir](https://github.com/vdimir)).
+* Remove wrong assertion in cache [#49376](https://github.com/ClickHouse/ClickHouse/pull/49376) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* A better way of excluding ISA-L on non-x86 [#49378](https://github.com/ClickHouse/ClickHouse/pull/49378) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix decimal aggregates test for s390x [#49382](https://github.com/ClickHouse/ClickHouse/pull/49382) ([Harry Lee](https://github.com/HarryLeeIBM)).
+* Move logging one line higher [#49387](https://github.com/ClickHouse/ClickHouse/pull/49387) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Improve CI: status commit, auth for get_gh_api [#49388](https://github.com/ClickHouse/ClickHouse/pull/49388) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fix printing hung queries in clickhouse-test. [#49389](https://github.com/ClickHouse/ClickHouse/pull/49389) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Correctly stop CNF convert for too many atomics in new analyzer [#49402](https://github.com/ClickHouse/ClickHouse/pull/49402) ([Antonio Andelic](https://github.com/antonio2368)).
+* Remove 02707_complex_query_fails_analyzer test [#49403](https://github.com/ClickHouse/ClickHouse/pull/49403) ([Dmitry Novik](https://github.com/novikd)).
+* Update FileSegment.cpp [#49411](https://github.com/ClickHouse/ClickHouse/pull/49411) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Switch Block::NameMap to google::dense_hash_map over HashMap [#49412](https://github.com/ClickHouse/ClickHouse/pull/49412) ([Azat Khuzhin](https://github.com/azat)).
+* Slightly reduce inter-header dependencies [#49413](https://github.com/ClickHouse/ClickHouse/pull/49413) ([Azat Khuzhin](https://github.com/azat)).
+* Update WithFileName.cpp [#49414](https://github.com/ClickHouse/ClickHouse/pull/49414) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Fix some assertions failing in stress test [#49415](https://github.com/ClickHouse/ClickHouse/pull/49415) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Correctly cleanup sequential node in ZooKeeperWithFaultInjection [#49418](https://github.com/ClickHouse/ClickHouse/pull/49418) ([vdimir](https://github.com/vdimir)).
+* Throw an exception for non-parametric functions in new analyzer [#49419](https://github.com/ClickHouse/ClickHouse/pull/49419) ([Dmitry Novik](https://github.com/novikd)).
+* Fix some bad error messages [#49420](https://github.com/ClickHouse/ClickHouse/pull/49420) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Update version_date.tsv and changelogs after v23.4.2.11-stable [#49422](https://github.com/ClickHouse/ClickHouse/pull/49422) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Remove trash [#49423](https://github.com/ClickHouse/ClickHouse/pull/49423) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Whitespaces [#49424](https://github.com/ClickHouse/ClickHouse/pull/49424) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove dependency from DB::Context in remote/cache readers [#49426](https://github.com/ClickHouse/ClickHouse/pull/49426) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Merging [#49066](https://github.com/ClickHouse/ClickHouse/issues/49066) (Better error handling during loading of parts) [#49430](https://github.com/ClickHouse/ClickHouse/pull/49430) ([Anton Popov](https://github.com/CurtizJ)).
+* Remove all S3 blobs when a merge is aborted, and remove parts from failed fetches without unlocking Keeper [#49432](https://github.com/ClickHouse/ClickHouse/pull/49432) ([Sema Checherinda](https://github.com/CheSema)).
+* Make INSERT do more things in parallel to avoid getting bottlenecked on one thread [#49434](https://github.com/ClickHouse/ClickHouse/pull/49434) ([Michael Kolupaev](https://github.com/al13n321)).
+* Make 'exceptions shorter than 30' test less noisy [#49435](https://github.com/ClickHouse/ClickHouse/pull/49435) ([Michael Kolupaev](https://github.com/al13n321)).
+* Build fixes for ENABLE_LIBRARIES=OFF [#49437](https://github.com/ClickHouse/ClickHouse/pull/49437) ([Azat Khuzhin](https://github.com/azat)).
+* Add image for docker-server jepsen [#49452](https://github.com/ClickHouse/ClickHouse/pull/49452) ([alesapin](https://github.com/alesapin)).
+* Follow-up to [#48792](https://github.com/ClickHouse/ClickHouse/issues/48792) [#49458](https://github.com/ClickHouse/ClickHouse/pull/49458) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Add method `getCurrentAvailabilityZone` to `AWSEC2MetadataClient` [#49464](https://github.com/ClickHouse/ClickHouse/pull/49464) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Add an integration test for `shutdown_wait_unfinished_queries` [#49469](https://github.com/ClickHouse/ClickHouse/pull/49469) ([Konstantin Bogdanov](https://github.com/thevar1able)).
+* Replace `NO DELAY` with `SYNC` in tests [#49470](https://github.com/ClickHouse/ClickHouse/pull/49470) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Check the PRs body directly in lambda, without rerun. Fix RCE in the CI [#49475](https://github.com/ClickHouse/ClickHouse/pull/49475) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Minor changes for setThreadName [#49476](https://github.com/ClickHouse/ClickHouse/pull/49476) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Static cast std::atomic to uint64_t to serialize. [#49482](https://github.com/ClickHouse/ClickHouse/pull/49482) ([alekar](https://github.com/alekar)).
+* Fix logical error in stress test, add some logging [#49491](https://github.com/ClickHouse/ClickHouse/pull/49491) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fixes in server jepsen image [#49492](https://github.com/ClickHouse/ClickHouse/pull/49492) ([alesapin](https://github.com/alesapin)).
+* Fix UserTimeMicroseconds and SystemTimeMicroseconds descriptions [#49521](https://github.com/ClickHouse/ClickHouse/pull/49521) ([Sergei Trifonov](https://github.com/serxa)).
+* Remove garbage from HDFS [#49531](https://github.com/ClickHouse/ClickHouse/pull/49531) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Split ReadWriteBufferFromHTTP.h into .h and .cpp file [#49533](https://github.com/ClickHouse/ClickHouse/pull/49533) ([Michael Kolupaev](https://github.com/al13n321)).
+* Remove garbage from Pretty format [#49534](https://github.com/ClickHouse/ClickHouse/pull/49534) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Make input_format_parquet_preserve_order imply !parallelize_output_from_storages [#49536](https://github.com/ClickHouse/ClickHouse/pull/49536) ([Michael Kolupaev](https://github.com/al13n321)).
+* Remove extra semicolons [#49545](https://github.com/ClickHouse/ClickHouse/pull/49545) ([Bulat Gaifullin](https://github.com/bgaifullin)).
+* Fix 00597_push_down_predicate_long for analyzer [#49551](https://github.com/ClickHouse/ClickHouse/pull/49551) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix stress test (assertion 'key_metadata.lock()') [#49554](https://github.com/ClickHouse/ClickHouse/pull/49554) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix writeAnyEscapedString if quote_character is a meta character [#49558](https://github.com/ClickHouse/ClickHouse/pull/49558) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add CMake option for BOOST_USE_UCONTEXT [#49564](https://github.com/ClickHouse/ClickHouse/pull/49564) ([ltrk2](https://github.com/ltrk2)).
+* Fix 01655_plan_optimizations_optimize_read_in_window_order for analyzer [#49565](https://github.com/ClickHouse/ClickHouse/pull/49565) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix `ThreadPool::wait` [#49572](https://github.com/ClickHouse/ClickHouse/pull/49572) ([Anton Popov](https://github.com/CurtizJ)).
+* Query cache: disable for internal queries [#49573](https://github.com/ClickHouse/ClickHouse/pull/49573) ([Robert Schulze](https://github.com/rschu1ze)).
+* Remove `test_merge_tree_s3_restore` [#49576](https://github.com/ClickHouse/ClickHouse/pull/49576) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix bad test [#49578](https://github.com/ClickHouse/ClickHouse/pull/49578) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove obsolete test about deprecated feature [#49579](https://github.com/ClickHouse/ClickHouse/pull/49579) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Avoid error found by AST Fuzzer [#49580](https://github.com/ClickHouse/ClickHouse/pull/49580) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix wrong assert [#49581](https://github.com/ClickHouse/ClickHouse/pull/49581) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Flaky test 02723_zookeeper_name.sql [#49592](https://github.com/ClickHouse/ClickHouse/pull/49592) ([Sema Checherinda](https://github.com/CheSema)).
+* Query Cache: Safeguard against empty chunks [#49593](https://github.com/ClickHouse/ClickHouse/pull/49593) ([Robert Schulze](https://github.com/rschu1ze)).
+* 02723_zookeeper_name: Force a deterministic result order [#49594](https://github.com/ClickHouse/ClickHouse/pull/49594) ([Robert Schulze](https://github.com/rschu1ze)).
+* Remove dangerous code (stringstream) [#49595](https://github.com/ClickHouse/ClickHouse/pull/49595) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove some code [#49596](https://github.com/ClickHouse/ClickHouse/pull/49596) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove "locale" [#49597](https://github.com/ClickHouse/ClickHouse/pull/49597) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* CMake: Cleanup utils build [#49598](https://github.com/ClickHouse/ClickHouse/pull/49598) ([Robert Schulze](https://github.com/rschu1ze)).
+* Follow-up for [#49580](https://github.com/ClickHouse/ClickHouse/issues/49580) [#49604](https://github.com/ClickHouse/ClickHouse/pull/49604) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix typo [#49605](https://github.com/ClickHouse/ClickHouse/pull/49605) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix bad test 01660_system_parts_smoke [#49611](https://github.com/ClickHouse/ClickHouse/pull/49611) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Minor changes [#49612](https://github.com/ClickHouse/ClickHouse/pull/49612) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Follow-up for [#49576](https://github.com/ClickHouse/ClickHouse/issues/49576) [#49615](https://github.com/ClickHouse/ClickHouse/pull/49615) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix error in [#48300](https://github.com/ClickHouse/ClickHouse/issues/48300) [#49616](https://github.com/ClickHouse/ClickHouse/pull/49616) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix typo: "as much slots" -> "as many slots" [#49617](https://github.com/ClickHouse/ClickHouse/pull/49617) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Better concurrent parts removal with zero copy [#49619](https://github.com/ClickHouse/ClickHouse/pull/49619) ([alesapin](https://github.com/alesapin)).
+* CMake: Remove legacy switch for ccache [#49627](https://github.com/ClickHouse/ClickHouse/pull/49627) ([Robert Schulze](https://github.com/rschu1ze)).
+* Try to fix integration test 'test_ssl_cert_authentication' [#49632](https://github.com/ClickHouse/ClickHouse/pull/49632) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Unflake 01660_system_parts_smoke [#49633](https://github.com/ClickHouse/ClickHouse/pull/49633) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add trash [#49634](https://github.com/ClickHouse/ClickHouse/pull/49634) ([Robert Schulze](https://github.com/rschu1ze)).
+* Remove commented code [#49635](https://github.com/ClickHouse/ClickHouse/pull/49635) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add flaky test [#49646](https://github.com/ClickHouse/ClickHouse/pull/49646) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix race in `Context::createCopy` [#49663](https://github.com/ClickHouse/ClickHouse/pull/49663) ([Anton Popov](https://github.com/CurtizJ)).
+* Disable 01710_projection_aggregation_in_order.sql [#49667](https://github.com/ClickHouse/ClickHouse/pull/49667) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix flaky 02684_bson.sql [#49674](https://github.com/ClickHouse/ClickHouse/pull/49674) ([Kruglov Pavel](https://github.com/Avogar)).
+* Some cache cleanup after the locking rework [#49675](https://github.com/ClickHouse/ClickHouse/pull/49675) ([Igor Nikonov](https://github.com/devcrafter)).
+* Correctly update log pointer during database replica recovery [#49676](https://github.com/ClickHouse/ClickHouse/pull/49676) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Enable distinct in order after fix [#49636](https://github.com/ClickHouse/ClickHouse/issues/49636) [#49677](https://github.com/ClickHouse/ClickHouse/pull/49677) ([Igor Nikonov](https://github.com/devcrafter)).
+* Build fixes for RISCV64 [#49688](https://github.com/ClickHouse/ClickHouse/pull/49688) ([Azat Khuzhin](https://github.com/azat)).
+* Add some logging [#49690](https://github.com/ClickHouse/ClickHouse/pull/49690) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix a wrong built generator removal, use `depth=1` [#49692](https://github.com/ClickHouse/ClickHouse/pull/49692) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fix member call on null pointer in AST fuzzer [#49696](https://github.com/ClickHouse/ClickHouse/pull/49696) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Improve woboq codebrowser pipeline [#49701](https://github.com/ClickHouse/ClickHouse/pull/49701) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Enable `do_not_evict_index_and_mark_files` by default [#49702](https://github.com/ClickHouse/ClickHouse/pull/49702) ([Nikita Taranov](https://github.com/nickitat)).
+* Backport fix for UBSan error in musl/logf.c [#49705](https://github.com/ClickHouse/ClickHouse/pull/49705) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix flaky test for `kolmogorovSmirnovTest` function [#49710](https://github.com/ClickHouse/ClickHouse/pull/49710) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Update clickhouse-test [#49712](https://github.com/ClickHouse/ClickHouse/pull/49712) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* IBM s390x: IP encoding fix [#49713](https://github.com/ClickHouse/ClickHouse/pull/49713) ([Suzy Wang](https://github.com/SuzyWangIBMer)).
+* Remove not used ErrorCodes [#49715](https://github.com/ClickHouse/ClickHouse/pull/49715) ([Sergei Trifonov](https://github.com/serxa)).
+* Disable mmap for StorageFile in clickhouse-server [#49717](https://github.com/ClickHouse/ClickHouse/pull/49717) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix typo [#49718](https://github.com/ClickHouse/ClickHouse/pull/49718) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Do not launch workflows for PRs w/o "can be tested" [#49726](https://github.com/ClickHouse/ClickHouse/pull/49726) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Move assertions after logging [#49729](https://github.com/ClickHouse/ClickHouse/pull/49729) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Docs: Fix sidebar label for dictionary table function [#49730](https://github.com/ClickHouse/ClickHouse/pull/49730) ([Robert Schulze](https://github.com/rschu1ze)).
+* Do not allocate own buffer in CachedOnDiskReadBufferFromFile when `use_external_buffer == true` [#49733](https://github.com/ClickHouse/ClickHouse/pull/49733) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix conversion [#49749](https://github.com/ClickHouse/ClickHouse/pull/49749) ([Sema Checherinda](https://github.com/CheSema)).
+* Fix flaky test 02504_regexp_dictionary_ua_parser [#49753](https://github.com/ClickHouse/ClickHouse/pull/49753) ([Han Fei](https://github.com/hanfei1991)).
+* Fix unit test `ExceptionFromWait` [#49755](https://github.com/ClickHouse/ClickHouse/pull/49755) ([Anton Popov](https://github.com/CurtizJ)).
+* Add forgotten lock (addition to [#49117](https://github.com/ClickHouse/ClickHouse/issues/49117)) [#49757](https://github.com/ClickHouse/ClickHouse/pull/49757) ([Anton Popov](https://github.com/CurtizJ)).
+* Fix typo [#49762](https://github.com/ClickHouse/ClickHouse/pull/49762) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix build of `libfiu` on clang-16 [#49766](https://github.com/ClickHouse/ClickHouse/pull/49766) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Update README.md [#49782](https://github.com/ClickHouse/ClickHouse/pull/49782) ([Tyler Hannan](https://github.com/tylerhannan)).
+* Analyzer: fix column not found for optimized prewhere with sample by [#49784](https://github.com/ClickHouse/ClickHouse/pull/49784) ([vdimir](https://github.com/vdimir)).
+* Typo: demange.cpp --> demangle.cpp [#49799](https://github.com/ClickHouse/ClickHouse/pull/49799) ([Robert Schulze](https://github.com/rschu1ze)).
+* Analyzer: apply _CAST to constants only once [#49800](https://github.com/ClickHouse/ClickHouse/pull/49800) ([Dmitry Novik](https://github.com/novikd)).
+* Use CLOCK_MONOTONIC_RAW over CLOCK_MONOTONIC on Linux (fixes non monotonic clock) [#49819](https://github.com/ClickHouse/ClickHouse/pull/49819) ([Azat Khuzhin](https://github.com/azat)).
+* README.md: 4 --> 5 [#49822](https://github.com/ClickHouse/ClickHouse/pull/49822) ([Robert Schulze](https://github.com/rschu1ze)).
+* Allow ASOF JOIN over a nullable right column (see the sketch at the end of this list) [#49826](https://github.com/ClickHouse/ClickHouse/pull/49826) ([vdimir](https://github.com/vdimir)).
+* Make 01533_multiple_nested test more reliable [#49828](https://github.com/ClickHouse/ClickHouse/pull/49828) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* What happens if I remove everything in msan_suppressions? [#49829](https://github.com/ClickHouse/ClickHouse/pull/49829) ([Robert Schulze](https://github.com/rschu1ze)).
+* Update README.md [#49832](https://github.com/ClickHouse/ClickHouse/pull/49832) ([AnneClickHouse](https://github.com/AnneClickHouse)).
+* Randomize enable_multiple_prewhere_read_steps setting [#49834](https://github.com/ClickHouse/ClickHouse/pull/49834) ([Alexander Gololobov](https://github.com/davenger)).
+* Analyzer: do not optimize GROUP BY keys with ROLLUP and CUBE [#49838](https://github.com/ClickHouse/ClickHouse/pull/49838) ([Dmitry Novik](https://github.com/novikd)).
+* Clearable hash table and zero values [#49846](https://github.com/ClickHouse/ClickHouse/pull/49846) ([Igor Nikonov](https://github.com/devcrafter)).
+* Reset vectorscan reference to an "official" repo [#49848](https://github.com/ClickHouse/ClickHouse/pull/49848) ([Robert Schulze](https://github.com/rschu1ze)).
+* Enable few slow clang-tidy checks for clangd [#49855](https://github.com/ClickHouse/ClickHouse/pull/49855) ([Azat Khuzhin](https://github.com/azat)).
+* Update QPL docs [#49857](https://github.com/ClickHouse/ClickHouse/pull/49857) ([Robert Schulze](https://github.com/rschu1ze)).
+* Small-ish .clang-tidy update [#49859](https://github.com/ClickHouse/ClickHouse/pull/49859) ([Robert Schulze](https://github.com/rschu1ze)).
+* Follow-up for clang-tidy [#49861](https://github.com/ClickHouse/ClickHouse/pull/49861) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix "reference to local binding" after fixes for clang-17 [#49874](https://github.com/ClickHouse/ClickHouse/pull/49874) ([Azat Khuzhin](https://github.com/azat)).
+* Fix typo [#49876](https://github.com/ClickHouse/ClickHouse/pull/49876) ([JackyWoo](https://github.com/JackyWoo)).
+* Log with warning if the server was terminated forcefully [#49881](https://github.com/ClickHouse/ClickHouse/pull/49881) ([Azat Khuzhin](https://github.com/azat)).
+* Fix some tests [#49889](https://github.com/ClickHouse/ClickHouse/pull/49889) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Use chassert in MergeTreeDeduplicationLog to have better log info [#49891](https://github.com/ClickHouse/ClickHouse/pull/49891) ([Han Fei](https://github.com/hanfei1991)).
+* Multiple pools support for AsyncLoader [#49893](https://github.com/ClickHouse/ClickHouse/pull/49893) ([Sergei Trifonov](https://github.com/serxa)).
+* Fix stack-use-after-scope in resource manager test [#49908](https://github.com/ClickHouse/ClickHouse/pull/49908) ([Sergei Trifonov](https://github.com/serxa)).
+* Retry connection expired in test_rename_column/test.py [#49911](https://github.com/ClickHouse/ClickHouse/pull/49911) ([alesapin](https://github.com/alesapin)).
+* Try to fix flaky test_distributed_load_balancing tests [#49912](https://github.com/ClickHouse/ClickHouse/pull/49912) ([Kruglov Pavel](https://github.com/Avogar)).
+* Remove unused code [#49918](https://github.com/ClickHouse/ClickHouse/pull/49918) ([alesapin](https://github.com/alesapin)).
+* Fix flakiness of test_distributed_load_balancing test [#49921](https://github.com/ClickHouse/ClickHouse/pull/49921) ([Azat Khuzhin](https://github.com/azat)).
+* Add some logging [#49925](https://github.com/ClickHouse/ClickHouse/pull/49925) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Support hardlinking parts transactionally [#49931](https://github.com/ClickHouse/ClickHouse/pull/49931) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix for analyzer: 02377_optimize_sorting_by_input_stream_properties_e… [#49943](https://github.com/ClickHouse/ClickHouse/pull/49943) ([Igor Nikonov](https://github.com/devcrafter)).
+* Follow up to [#49429](https://github.com/ClickHouse/ClickHouse/issues/49429) [#49964](https://github.com/ClickHouse/ClickHouse/pull/49964) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix flaky test_ssl_cert_authentication to use urllib3 [#49982](https://github.com/ClickHouse/ClickHouse/pull/49982) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix woboq codebrowser build with -Wno-poison-system-directories [#49992](https://github.com/ClickHouse/ClickHouse/pull/49992) ([Azat Khuzhin](https://github.com/azat)).
+* test for [#46128](https://github.com/ClickHouse/ClickHouse/issues/46128) [#49993](https://github.com/ClickHouse/ClickHouse/pull/49993) ([Denny Crane](https://github.com/den-crane)).
+* Fix test_insert_same_partition_and_merge failing if one Azure request attempt fails [#49996](https://github.com/ClickHouse/ClickHouse/pull/49996) ([Michael Kolupaev](https://github.com/al13n321)).
+* Check return value of `ftruncate` in Keeper [#50020](https://github.com/ClickHouse/ClickHouse/pull/50020) ([Antonio Andelic](https://github.com/antonio2368)).
+* Add some assertions [#50025](https://github.com/ClickHouse/ClickHouse/pull/50025) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update 02441_alter_delete_and_drop_column.sql [#50027](https://github.com/ClickHouse/ClickHouse/pull/50027) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Move some common code to common [#50028](https://github.com/ClickHouse/ClickHouse/pull/50028) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Add method getCredentials() to S3::Client [#50030](https://github.com/ClickHouse/ClickHouse/pull/50030) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update query_log.md [#50032](https://github.com/ClickHouse/ClickHouse/pull/50032) ([Sergei Trifonov](https://github.com/serxa)).
+* Get rid of indirect write buffer in object storages [#50033](https://github.com/ClickHouse/ClickHouse/pull/50033) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Load balancing bugfixes [#50036](https://github.com/ClickHouse/ClickHouse/pull/50036) ([Sergei Trifonov](https://github.com/serxa)).
+* Update S3 sdk to v1.11.61 [#50037](https://github.com/ClickHouse/ClickHouse/pull/50037) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix 02735_system_zookeeper_connection for DatabaseReplicated [#50047](https://github.com/ClickHouse/ClickHouse/pull/50047) ([Azat Khuzhin](https://github.com/azat)).
+* Add more profile events for distributed connections [#50051](https://github.com/ClickHouse/ClickHouse/pull/50051) ([Sergei Trifonov](https://github.com/serxa)).
+* FileCache: simple tryReserve() cleanup [#50059](https://github.com/ClickHouse/ClickHouse/pull/50059) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix hashed/sparse_hashed dictionaries max_load_factor upper range [#50065](https://github.com/ClickHouse/ClickHouse/pull/50065) ([Azat Khuzhin](https://github.com/azat)).
+* Clearer coordinator log [#50101](https://github.com/ClickHouse/ClickHouse/pull/50101) ([Raúl Marín](https://github.com/Algunenano)).
+* Analyzer: Do not execute table functions multiple times [#50105](https://github.com/ClickHouse/ClickHouse/pull/50105) ([Dmitry Novik](https://github.com/novikd)).
+* Update default settings for Replicated database [#50108](https://github.com/ClickHouse/ClickHouse/pull/50108) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Make async prefetched buffer work with arbitrary impl [#50109](https://github.com/ClickHouse/ClickHouse/pull/50109) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update github.com/distribution/distribution [#50114](https://github.com/ClickHouse/ClickHouse/pull/50114) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Docs: Update clickhouse-local arguments [#50138](https://github.com/ClickHouse/ClickHouse/pull/50138) ([Robert Schulze](https://github.com/rschu1ze)).
+* Change fields destruction order in AsyncTaskExecutor [#50151](https://github.com/ClickHouse/ClickHouse/pull/50151) ([Kruglov Pavel](https://github.com/Avogar)).
+* Follow-up to [#49889](https://github.com/ClickHouse/ClickHouse/issues/49889) [#50152](https://github.com/ClickHouse/ClickHouse/pull/50152) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Clarification comment on retries controller behavior [#50155](https://github.com/ClickHouse/ClickHouse/pull/50155) ([Igor Nikonov](https://github.com/devcrafter)).
+* Switch to upstream repository of vectorscan [#50159](https://github.com/ClickHouse/ClickHouse/pull/50159) ([Azat Khuzhin](https://github.com/azat)).
+* Refactor lambdas, prepare to prio runners [#50160](https://github.com/ClickHouse/ClickHouse/pull/50160) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Speed-up the shellcheck with parallel xargs [#50164](https://github.com/ClickHouse/ClickHouse/pull/50164) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update an exception message [#50180](https://github.com/ClickHouse/ClickHouse/pull/50180) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Upgrade boost submodule [#50188](https://github.com/ClickHouse/ClickHouse/pull/50188) ([ltrk2](https://github.com/ltrk2)).
+* Implement a uniform way to query processor core IDs [#50190](https://github.com/ClickHouse/ClickHouse/pull/50190) ([ltrk2](https://github.com/ltrk2)).
+* Don't replicate delete through DDL worker if there is just 1 shard [#50193](https://github.com/ClickHouse/ClickHouse/pull/50193) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix codebrowser by using clang-15 image [#50197](https://github.com/ClickHouse/ClickHouse/pull/50197) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Add comments to build reports [#50200](https://github.com/ClickHouse/ClickHouse/pull/50200) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Automatic backports of important fixes to cloud-release [#50202](https://github.com/ClickHouse/ClickHouse/pull/50202) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Unify priorities: lower value means higher priority [#50205](https://github.com/ClickHouse/ClickHouse/pull/50205) ([Sergei Trifonov](https://github.com/serxa)).
+* Use transactions for encrypted disks [#50206](https://github.com/ClickHouse/ClickHouse/pull/50206) ([alesapin](https://github.com/alesapin)).
+* Get detailed error instead of unknown error for function test [#50207](https://github.com/ClickHouse/ClickHouse/pull/50207) ([Suzy Wang](https://github.com/SuzyWangIBMer)).
+* README.md: Remove Berlin Meetup from upcoming events [#50218](https://github.com/ClickHouse/ClickHouse/pull/50218) ([Robert Schulze](https://github.com/rschu1ze)).
+* Minor adjustment of clickhouse-client/local parameter docs [#50219](https://github.com/ClickHouse/ClickHouse/pull/50219) ([Robert Schulze](https://github.com/rschu1ze)).
+* Unify priorities: rework IO scheduling subsystem [#50231](https://github.com/ClickHouse/ClickHouse/pull/50231) ([Sergei Trifonov](https://github.com/serxa)).
+* Add new metrics BrokenDistributedBytesToInsert/DistributedBytesToInsert [#50238](https://github.com/ClickHouse/ClickHouse/pull/50238) ([Azat Khuzhin](https://github.com/azat)).
+* Fix URL in backport comment [#50241](https://github.com/ClickHouse/ClickHouse/pull/50241) ([pufit](https://github.com/pufit)).
+* Fix `02535_max_parallel_replicas_custom_key` [#50242](https://github.com/ClickHouse/ClickHouse/pull/50242) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fixes for MergeTree with readonly disks [#50244](https://github.com/ClickHouse/ClickHouse/pull/50244) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Yet another refactoring [#50257](https://github.com/ClickHouse/ClickHouse/pull/50257) ([Anton Popov](https://github.com/CurtizJ)).
+* Unify priorities: rework AsyncLoader [#50272](https://github.com/ClickHouse/ClickHouse/pull/50272) ([Sergei Trifonov](https://github.com/serxa)).
+* Buffers: finalize before free in d-tor [#50275](https://github.com/ClickHouse/ClickHouse/pull/50275) ([Sema Checherinda](https://github.com/CheSema)).
+* Fix 02767_into_outfile_extensions_msan under analyzer [#50290](https://github.com/ClickHouse/ClickHouse/pull/50290) ([Azat Khuzhin](https://github.com/azat)).
+* QPL: Add a comment about isal [#50308](https://github.com/ClickHouse/ClickHouse/pull/50308) ([Robert Schulze](https://github.com/rschu1ze)).
+* Avoid clang 15 crash [#50310](https://github.com/ClickHouse/ClickHouse/pull/50310) ([Raúl Marín](https://github.com/Algunenano)).
+* Cleanup Annoy index [#50312](https://github.com/ClickHouse/ClickHouse/pull/50312) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix flaky `AsyncLoader.StaticPriorities` unit test [#50313](https://github.com/ClickHouse/ClickHouse/pull/50313) ([Sergei Trifonov](https://github.com/serxa)).
+* Update gtest_async_loader.cpp [#50317](https://github.com/ClickHouse/ClickHouse/pull/50317) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix IS (NOT) NULL operator priority [#50327](https://github.com/ClickHouse/ClickHouse/pull/50327) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Update README.md [#50340](https://github.com/ClickHouse/ClickHouse/pull/50340) ([Tyler Hannan](https://github.com/tylerhannan)).
+* Do not hard-code the event list in the test [#50342](https://github.com/ClickHouse/ClickHouse/pull/50342) ([Sema Checherinda](https://github.com/CheSema)).
+* less logs in WriteBufferFromS3 [#50347](https://github.com/ClickHouse/ClickHouse/pull/50347) ([Sema Checherinda](https://github.com/CheSema)).
+* Remove legacy install scripts superseded by universal.sh [#50360](https://github.com/ClickHouse/ClickHouse/pull/50360) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fail perf tests when too many queries slowed down [#50361](https://github.com/ClickHouse/ClickHouse/pull/50361) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix after [#50109](https://github.com/ClickHouse/ClickHouse/issues/50109) [#50362](https://github.com/ClickHouse/ClickHouse/pull/50362) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix log message [#50363](https://github.com/ClickHouse/ClickHouse/pull/50363) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Compare functions NaN update test [#50366](https://github.com/ClickHouse/ClickHouse/pull/50366) ([Maksim Kita](https://github.com/kitaisreal)).
+* Add re-creation for cherry-pick PRs [#50373](https://github.com/ClickHouse/ClickHouse/pull/50373) ([pufit](https://github.com/pufit)).
+* Not applying `prepareRightBlock` causes a block structure mismatch [#50383](https://github.com/ClickHouse/ClickHouse/pull/50383) ([lgbo](https://github.com/lgbo-ustc)).
+* Fix hang in unit tests [#50391](https://github.com/ClickHouse/ClickHouse/pull/50391) ([Sema Checherinda](https://github.com/CheSema)).
+* Fix poll timeout in MaterializedMySQL [#50392](https://github.com/ClickHouse/ClickHouse/pull/50392) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Enable aggregate expression compilation by default [#50401](https://github.com/ClickHouse/ClickHouse/pull/50401) ([Maksim Kita](https://github.com/kitaisreal)).
+* Update app.py [#50407](https://github.com/ClickHouse/ClickHouse/pull/50407) ([Nikita Taranov](https://github.com/nickitat)).
+* Reuse s3_mocks, rewrite test test_paranoid_check_in_logs [#50408](https://github.com/ClickHouse/ClickHouse/pull/50408) ([Sema Checherinda](https://github.com/CheSema)).
+* test for [#42610](https://github.com/ClickHouse/ClickHouse/issues/42610) [#50409](https://github.com/ClickHouse/ClickHouse/pull/50409) ([Denny Crane](https://github.com/den-crane)).
+* Remove something [#50411](https://github.com/ClickHouse/ClickHouse/pull/50411) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Mark the builds without results as pending [#50415](https://github.com/ClickHouse/ClickHouse/pull/50415) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Revert "Fix msan issue in keyed siphash" [#50426](https://github.com/ClickHouse/ClickHouse/pull/50426) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Revert "Revert "less logs in WriteBufferFromS3" ([#50390](https://github.com/ClickHouse/ClickHouse/issues/50390))" [#50444](https://github.com/ClickHouse/ClickHouse/pull/50444) ([Sema Checherinda](https://github.com/CheSema)).
+* Paranoid fix for removing parts from ZooKeeper [#50448](https://github.com/ClickHouse/ClickHouse/pull/50448) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Add timeout for unit tests [#50449](https://github.com/ClickHouse/ClickHouse/pull/50449) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Changes related to an internal feature [#50453](https://github.com/ClickHouse/ClickHouse/pull/50453) ([Michael Kolupaev](https://github.com/al13n321)).
+* Don't crash if config doesn't have logger section [#50455](https://github.com/ClickHouse/ClickHouse/pull/50455) ([Michael Kolupaev](https://github.com/al13n321)).
+* Update function docs [#50466](https://github.com/ClickHouse/ClickHouse/pull/50466) ([Robert Schulze](https://github.com/rschu1ze)).
+* Revert "make filter push down through cross join" [#50467](https://github.com/ClickHouse/ClickHouse/pull/50467) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Add some assertions [#50470](https://github.com/ClickHouse/ClickHouse/pull/50470) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* CI: Enable aspell on nested docs [#50476](https://github.com/ClickHouse/ClickHouse/pull/50476) ([Robert Schulze](https://github.com/rschu1ze)).
+* Try fix flaky test test_async_query_sending [#50480](https://github.com/ClickHouse/ClickHouse/pull/50480) ([Kruglov Pavel](https://github.com/Avogar)).
+* Disable 00534_functions_bad_arguments with msan [#50481](https://github.com/ClickHouse/ClickHouse/pull/50481) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Typos: Follow-up to [#50476](https://github.com/ClickHouse/ClickHouse/issues/50476) [#50482](https://github.com/ClickHouse/ClickHouse/pull/50482) ([Robert Schulze](https://github.com/rschu1ze)).
+* Remove unneeded Keeper test [#50485](https://github.com/ClickHouse/ClickHouse/pull/50485) ([Antonio Andelic](https://github.com/antonio2368)).
+* Fix KeyError in cherry-pick [#50493](https://github.com/ClickHouse/ClickHouse/pull/50493) ([pufit](https://github.com/pufit)).
+* Make typeid_cast for pointers noexcept [#50495](https://github.com/ClickHouse/ClickHouse/pull/50495) ([Sergey Kazmin](https://github.com/yerseg)).
+* Fewer traces in logs [#50518](https://github.com/ClickHouse/ClickHouse/pull/50518) ([Sema Checherinda](https://github.com/CheSema)).
+* Implement endianness-independent serialization for UUID [#50519](https://github.com/ClickHouse/ClickHouse/pull/50519) ([ltrk2](https://github.com/ltrk2)).
+* Remove strange object storage methods [#50521](https://github.com/ClickHouse/ClickHouse/pull/50521) ([alesapin](https://github.com/alesapin)).
+* Fix low quality code around metadata in RocksDB (experimental feature never used in production) [#50527](https://github.com/ClickHouse/ClickHouse/pull/50527) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Function if constant folding [#50529](https://github.com/ClickHouse/ClickHouse/pull/50529) ([Maksim Kita](https://github.com/kitaisreal)).
+* Add profile events for fs cache eviction [#50533](https://github.com/ClickHouse/ClickHouse/pull/50533) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* QueryNode small fix [#50535](https://github.com/ClickHouse/ClickHouse/pull/50535) ([Maksim Kita](https://github.com/kitaisreal)).
+* Control memory usage in generateRandom [#50538](https://github.com/ClickHouse/ClickHouse/pull/50538) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Disable skim (Rust library) under memory sanitizer [#50539](https://github.com/ClickHouse/ClickHouse/pull/50539) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* MSan support for Rust [#50541](https://github.com/ClickHouse/ClickHouse/pull/50541) ([Azat Khuzhin](https://github.com/azat)).
+* Make 01565_query_loop_after_client_error slightly more robust [#50542](https://github.com/ClickHouse/ClickHouse/pull/50542) ([Azat Khuzhin](https://github.com/azat)).
+* Resize BufferFromVector underlying vector only when pos_offset == vector.size() [#50546](https://github.com/ClickHouse/ClickHouse/pull/50546) ([auxten](https://github.com/auxten)).
+* Add async iteration to object storage [#50548](https://github.com/ClickHouse/ClickHouse/pull/50548) ([alesapin](https://github.com/alesapin)).
+* Skip extracting the Darwin toolchain in builder when unnecessary [#50550](https://github.com/ClickHouse/ClickHouse/pull/50550) ([SuperDJY](https://github.com/cmsxbc)).
+* Remove flaky test [#50558](https://github.com/ClickHouse/ClickHouse/pull/50558) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Revert "Disable skim (Rust library) under memory sanitizer" [#50574](https://github.com/ClickHouse/ClickHouse/pull/50574) ([Azat Khuzhin](https://github.com/azat)).
+* Analyzer: fix 01487_distributed_in_not_default_db [#50587](https://github.com/ClickHouse/ClickHouse/pull/50587) ([Dmitry Novik](https://github.com/novikd)).
+* Fix commit for DiskObjectStorage [#50599](https://github.com/ClickHouse/ClickHouse/pull/50599) ([alesapin](https://github.com/alesapin)).
+* Fix Jepsen runs in PRs [#50615](https://github.com/ClickHouse/ClickHouse/pull/50615) ([Antonio Andelic](https://github.com/antonio2368)).
+* Revert incorrect optimizations [#50629](https://github.com/ClickHouse/ClickHouse/pull/50629) ([Raúl Marín](https://github.com/Algunenano)).
+* Disable 01676_clickhouse_client_autocomplete under UBSan [#50636](https://github.com/ClickHouse/ClickHouse/pull/50636) ([Nikita Taranov](https://github.com/nickitat)).
+* Merging [#50329](https://github.com/ClickHouse/ClickHouse/issues/50329) [#50660](https://github.com/ClickHouse/ClickHouse/pull/50660) ([Anton Popov](https://github.com/CurtizJ)).
+* Revert "date_trunc function to always return DateTime type" [#50670](https://github.com/ClickHouse/ClickHouse/pull/50670) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Fix flaky test 02461_prewhere_row_level_policy_lightweight_delete [#50674](https://github.com/ClickHouse/ClickHouse/pull/50674) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix asan issue with analyzer and prewhere [#50685](https://github.com/ClickHouse/ClickHouse/pull/50685) ([Alexander Gololobov](https://github.com/davenger)).
+* Catch issues with dockerd during the build [#50700](https://github.com/ClickHouse/ClickHouse/pull/50700) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Temporarily disable annoy index tests (flaky for analyzer) [#50714](https://github.com/ClickHouse/ClickHouse/pull/50714) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix assertion from stress test [#50718](https://github.com/ClickHouse/ClickHouse/pull/50718) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix flaky unit test [#50719](https://github.com/ClickHouse/ClickHouse/pull/50719) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Show correct sharing state in system.query_cache [#50728](https://github.com/ClickHouse/ClickHouse/pull/50728) ([Robert Schulze](https://github.com/rschu1ze)).
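+
+A minimal sketch of the ASOF JOIN case from [#49826](https://github.com/ClickHouse/ClickHouse/pull/49826) above; the tables, data, and expected behavior here are illustrative assumptions, not taken from the PR:
+
+```sql
+-- Illustrative only: an ASOF JOIN whose right-hand inequality column is Nullable.
+CREATE TABLE events (k UInt32, t UInt32) ENGINE = Memory;
+CREATE TABLE quotes (k UInt32, t Nullable(UInt32), price Float64) ENGINE = Memory;
+
+INSERT INTO events VALUES (1, 10), (1, 20);
+INSERT INTO quotes VALUES (1, 5, 100.0), (1, NULL, 0.0), (1, 15, 101.0);
+
+-- Rows with NULL in quotes.t should be skipped rather than rejected.
+SELECT e.k, e.t, q.price
+FROM events AS e
+ASOF LEFT JOIN quotes AS q ON e.k = q.k AND e.t >= q.t;
+```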
+
diff --git a/docs/changelogs/v23.5.2.7-stable.md b/docs/changelogs/v23.5.2.7-stable.md
new file mode 100644
index 00000000000..2e4931c64e0
--- /dev/null
+++ b/docs/changelogs/v23.5.2.7-stable.md
@@ -0,0 +1,18 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.5.2.7-stable (5751aa1ab9f) FIXME as compared to v23.5.1.3174-stable (2fec796e73e)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Do not read all the columns from the right table of a GLOBAL JOIN (sketched below). [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
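+
+A hedged sketch of the query shape this fix targets; the distributed tables here are hypothetical:
+
+```sql
+-- Illustrative only: with GLOBAL JOIN the right table is collected and sent to
+-- all shards; after #50721 only the columns the query actually uses
+-- (id and name) should be read from it, not every column.
+SELECT l.id, r.name
+FROM left_distributed AS l
+GLOBAL JOIN right_distributed AS r ON l.id = r.id;
+```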
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Fix build for aarch64 (temporarily disable Azure) [#50770](https://github.com/ClickHouse/ClickHouse/pull/50770) ([alesapin](https://github.com/alesapin)).
+* Rename azure_blob_storage to azureBlobStorage [#50812](https://github.com/ClickHouse/ClickHouse/pull/50812) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+
diff --git a/docs/changelogs/v23.5.3.24-stable.md b/docs/changelogs/v23.5.3.24-stable.md
new file mode 100644
index 00000000000..967a50b3b0e
--- /dev/null
+++ b/docs/changelogs/v23.5.3.24-stable.md
@@ -0,0 +1,26 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.5.3.24-stable (76f54616d3b) FIXME as compared to v23.5.2.7-stable (5751aa1ab9f)
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Fix Log-family tables returning a wrong row count after truncate (see the sketch after this list) [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Fix bug in `uniqExact` parallel merging [#50590](https://github.com/ClickHouse/ClickHouse/pull/50590) ([Nikita Taranov](https://github.com/nickitat)).
+* Revert recent grace hash join changes [#50699](https://github.com/ClickHouse/ClickHouse/pull/50699) ([vdimir](https://github.com/vdimir)).
+* Avoid storing logs in Keeper containing unknown operation [#50751](https://github.com/ClickHouse/ClickHouse/pull/50751) ([Antonio Andelic](https://github.com/antonio2368)).
+* Add compat setting for non-const timezones [#50834](https://github.com/ClickHouse/ClickHouse/pull/50834) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix iceberg V2 optional metadata parsing [#50974](https://github.com/ClickHouse/ClickHouse/pull/50974) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
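+
+A minimal sketch of the misbehavior fixed by [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) above; the table is illustrative:
+
+```sql
+-- Illustrative only.
+CREATE TABLE log_example (x UInt8) ENGINE = Log;
+INSERT INTO log_example VALUES (1), (2), (3);
+TRUNCATE TABLE log_example;
+SELECT count() FROM log_example; -- must be 0; the bug could report a stale count
+```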
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Don't mark a part as broken on `Poco::TimeoutException` [#50811](https://github.com/ClickHouse/ClickHouse/pull/50811) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix the version tweak for tagged commits, improve version_helper [#51035](https://github.com/ClickHouse/ClickHouse/pull/51035) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* SQLancer has changed its default branch from master to main [#51060](https://github.com/ClickHouse/ClickHouse/pull/51060) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
diff --git a/docs/changelogs/v23.5.4.25-stable.md b/docs/changelogs/v23.5.4.25-stable.md
new file mode 100644
index 00000000000..53d3a7c9c0a
--- /dev/null
+++ b/docs/changelogs/v23.5.4.25-stable.md
@@ -0,0 +1,31 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.5.4.25-stable (190f962abcf) FIXME as compared to v23.5.3.24-stable (76f54616d3b)
+
+#### Improvement
+* Backported in [#51235](https://github.com/ClickHouse/ClickHouse/issues/51235): Improve the progress bar for file/s3/hdfs/url table functions by using chunk size from source data and using incremental total size counting in each thread. Fix the progress bar for *Cluster functions. This closes [#47250](https://github.com/ClickHouse/ClickHouse/issues/47250). [#51088](https://github.com/ClickHouse/ClickHouse/pull/51088) ([Kruglov Pavel](https://github.com/Avogar)).
+* Backported in [#51255](https://github.com/ClickHouse/ClickHouse/issues/51255): Disable cache setting `do_not_evict_index_and_mark_files` (Was enabled in `23.5`). [#51222](https://github.com/ClickHouse/ClickHouse/pull/51222) ([Kseniia Sumarokova](https://github.com/kssenii)).
+
+#### Build/Testing/Packaging Improvement
+* Backported in [#51531](https://github.com/ClickHouse/ClickHouse/issues/51531): Split the huge `RUN` in the Dockerfile into smaller conditional steps. Install the necessary tools on demand in the same `RUN` layer and remove them afterwards. Upgrade the OS only once at the beginning. Use a modern way to check the signed repository. Downgrade the base image to ubuntu:20.04 to address issues on older Docker versions. Upgrade the golang version to address golang vulnerabilities. [#51504](https://github.com/ClickHouse/ClickHouse/pull/51504) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Backported in [#51572](https://github.com/ClickHouse/ClickHouse/issues/51572): This is a follow-up for [#51504](https://github.com/ClickHouse/ClickHouse/issues/51504); the cleanup was lost during refactoring. [#51564](https://github.com/ClickHouse/ClickHouse/pull/51564) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Query Cache: Try to fix bad cast from ColumnConst to ColumnVector [#50704](https://github.com/ClickHouse/ClickHouse/pull/50704) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix type of LDAP server params hash in cache entry [#50865](https://github.com/ClickHouse/ClickHouse/pull/50865) ([Julian Maicher](https://github.com/jmaicher)).
+* Fallback to parsing big integer from String instead of exception in Parquet format [#50873](https://github.com/ClickHouse/ClickHouse/pull/50873) ([Kruglov Pavel](https://github.com/Avogar)).
+* Do not apply projection if read-in-order was enabled. [#50923](https://github.com/ClickHouse/ClickHouse/pull/50923) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix race in Azure blob storage iterator [#50936](https://github.com/ClickHouse/ClickHouse/pull/50936) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix ineffective query cache for SELECTs with subqueries [#51132](https://github.com/ClickHouse/ClickHouse/pull/51132) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix fuzzer failure in ActionsDAG [#51301](https://github.com/ClickHouse/ClickHouse/pull/51301) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Fix ParallelReadBuffer seek [#50820](https://github.com/ClickHouse/ClickHouse/pull/50820) ([Michael Kolupaev](https://github.com/al13n321)).
+
diff --git a/docs/changelogs/v23.6.1.1524-stable.md b/docs/changelogs/v23.6.1.1524-stable.md
new file mode 100644
index 00000000000..6d295d61ef4
--- /dev/null
+++ b/docs/changelogs/v23.6.1.1524-stable.md
@@ -0,0 +1,301 @@
+---
+sidebar_position: 1
+sidebar_label: 2023
+---
+
+# 2023 Changelog
+
+### ClickHouse release v23.6.1.1524-stable (d1c7e13d088) FIXME as compared to v23.5.1.3174-stable (2fec796e73e)
+
+#### Backward Incompatible Change
+* Delete feature `do_not_evict_index_and_mark_files` in the fs cache. This feature was only making things worse. [#51253](https://github.com/ClickHouse/ClickHouse/pull/51253) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Remove ALTER support for experimental LIVE VIEW. [#51287](https://github.com/ClickHouse/ClickHouse/pull/51287) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### New Feature
+* Add setting `session_timezone`; it is used as the default time zone for the session when one is not explicitly specified (see the sketch after this list). [#44149](https://github.com/ClickHouse/ClickHouse/pull/44149) ([Andrey Zvonov](https://github.com/zvonand)).
+* Added an overlay database engine and a representation of a directory as a database. This adds 4 databases: 1. DatabaseOverlay: implements the IDatabase interface; allows combining multiple databases, such as FileSystem and Memory; internally, it stores a vector of other database pointers and proxies requests to them in turn until one succeeds. 2. DatabaseFilesystem: allows read-only interaction with files stored on the file system; internally, it uses TableFunctionFile to implicitly load a file when a user requests the table; the result of the TableFunctionFile call is cached for quick access. 3. DatabaseS3: allows read-only interaction with S3 storage; it uses TableFunctionS3 to implicitly load tables from S3. 4. DatabaseHDFS: allows interaction with HDFS storage; it uses TableFunctionHDFS to implicitly load tables from HDFS. [#48821](https://github.com/ClickHouse/ClickHouse/pull/48821) ([alekseygolub](https://github.com/alekseygolub)).
+* Add a new setting named `use_mysql_types_in_show_columns` that makes the `SHOW COLUMNS` SQL statement display MySQL-equivalent types when a client is connected via the MySQL compatibility port. [#49577](https://github.com/ClickHouse/ClickHouse/pull/49577) ([Thomas Panetti](https://github.com/tpanetti)).
+* Added option `--rename_files_after_processing`. This closes [#34207](https://github.com/ClickHouse/ClickHouse/issues/34207). [#49626](https://github.com/ClickHouse/ClickHouse/pull/49626) ([alekseygolub](https://github.com/alekseygolub)).
+* Add `TableFunctionRedis` and a Redis table engine, add `RedisCommon`, which contains Redis-related tools and types, and support `equals` and `in` filter push-down into Redis. [#50150](https://github.com/ClickHouse/ClickHouse/pull/50150) ([JackyWoo](https://github.com/JackyWoo)).
+* Allow to skip empty files in file/s3/url/hdfs table functions using settings `s3_skip_empty_files`, `hdfs_skip_empty_files`, `engine_file_skip_empty_files`, `engine_url_skip_empty_files`. [#50364](https://github.com/ClickHouse/ClickHouse/pull/50364) ([Kruglov Pavel](https://github.com/Avogar)).
+* `clickhouse-client` can now be called with a connection string instead of `--host`, `--port`, `--user`, etc. [#50689](https://github.com/ClickHouse/ClickHouse/pull/50689) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Codec DEFLATE_QPL is now controlled via the server setting `enable_deflate_qpl_codec` (default: false) instead of the setting `allow_experimental_codecs`. This marks DEFLATE_QPL non-experimental. [#50775](https://github.com/ClickHouse/ClickHouse/pull/50775) ([Robert Schulze](https://github.com/rschu1ze)).
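+
+A minimal sketch of the new `session_timezone` setting; the chosen time zone and the exact interplay with `timeZone()` are assumptions based on the entry above:
+
+```sql
+-- Illustrative only: set the default time zone for this session.
+SET session_timezone = 'Europe/Berlin';
+SELECT timeZone(); -- presumably reports the session time zone now
+SELECT now();      -- rendered in the session time zone
+SELECT now('UTC'); -- an explicit time zone argument still takes precedence
+```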
+
+#### Performance Improvement
+* Improve performance when QueryProfiler is enabled by using a thread-local timer_id instead of a global object. [#48778](https://github.com/ClickHouse/ClickHouse/pull/48778) ([Jiebin Sun](https://github.com/jiebinn)).
+* Rewrite the CapnProto input/output format to improve its performance. Map column names to CapnProto fields case-insensitively; fix reading/writing of nested structure fields. [#49752](https://github.com/ClickHouse/ClickHouse/pull/49752) ([Kruglov Pavel](https://github.com/Avogar)).
+* Optimize parquet write performance for parallel threads. [#50102](https://github.com/ClickHouse/ClickHouse/pull/50102) ([Hongbin Ma](https://github.com/binmahone)).
+* Disable `parallelize_output_from_storages` for processing MATERIALIZED VIEWs and storages with one block only. [#50214](https://github.com/ClickHouse/ClickHouse/pull/50214) ([Azat Khuzhin](https://github.com/azat)).
+* Avoid block permutation during sort if the block is already sorted. This merges [#46558](https://github.com/ClickHouse/ClickHouse/pull/46558) (avoid processing already sorted data). [#50697](https://github.com/ClickHouse/ClickHouse/pull/50697) ([Maksim Kita](https://github.com/kitaisreal)).
+* In earlier PRs ([#50062](https://github.com/ClickHouse/ClickHouse/issues/50062), [#50307](https://github.com/ClickHouse/ClickHouse/issues/50307)), we proposed an optimization pattern which transforms predicates with toYear/toYYYYMM into an equivalent but converter-free form (see the sketch after this list). This transformation could bring a significant performance impact to some workloads, such as SSB. However, as issue [#50628](https://github.com/ClickHouse/ClickHouse/issues/50628) indicated, these two PRs introduced issues which could result in incomplete query results, so they were reverted by [#50629](https://github.com/ClickHouse/ClickHouse/issues/50629). [#50951](https://github.com/ClickHouse/ClickHouse/pull/50951) ([Zhiguo Zhou](https://github.com/ZhiguoZh)).
+* Make multiple list requests to ZooKeeper in parallel to speed up reading from system.zookeeper table. [#51042](https://github.com/ClickHouse/ClickHouse/pull/51042) ([Alexander Gololobov](https://github.com/davenger)).
+* Speedup initialization of DateTime lookup tables for time zones. This should reduce startup/connect time of clickhouse client especially in debug build as it is rather heavy. [#51347](https://github.com/ClickHouse/ClickHouse/pull/51347) ([Alexander Gololobov](https://github.com/davenger)).
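+
+For illustration, the kind of query that benefits from the parallel ZooKeeper list requests mentioned above (the paths are hypothetical):
+
+```sql
+-- Each path in the IN list can now be listed in parallel
+SELECT name, path
+FROM system.zookeeper
+WHERE path IN ('/clickhouse/tables', '/clickhouse/task_queue');
+```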
+
+#### Improvement
+* Allow casting IPv6 to IPv4 addresses for the CIDR `::ffff:0:0/96` (IPv4-mapped addresses). [#49759](https://github.com/ClickHouse/ClickHouse/pull/49759) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Update MongoDB protocol to support MongoDB 5.1 version and newer. Support for the versions with the old protocol (<3.6) is preserved. Closes [#45621](https://github.com/ClickHouse/ClickHouse/issues/45621), [#49879](https://github.com/ClickHouse/ClickHouse/issues/49879). [#50061](https://github.com/ClickHouse/ClickHouse/pull/50061) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Improved scheduling of merge selecting and cleanup tasks in `ReplicatedMergeTree`. The tasks will not be executed too frequently when there's nothing to merge or cleanup. Added settings `max_merge_selecting_sleep_ms`, `merge_selecting_sleep_slowdown_factor`, `max_cleanup_delay_period` and `cleanup_thread_preferred_points_per_iteration`. It should close [#31919](https://github.com/ClickHouse/ClickHouse/issues/31919). [#50107](https://github.com/ClickHouse/ClickHouse/pull/50107) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Support parallel replicas with the analyzer. [#50441](https://github.com/ClickHouse/ClickHouse/pull/50441) ([Raúl Marín](https://github.com/Algunenano)).
+* Add setting `input_format_max_bytes_to_read_for_schema_inference` to limit the number of bytes to read in schema inference. Closes [#50577](https://github.com/ClickHouse/ClickHouse/issues/50577). [#50592](https://github.com/ClickHouse/ClickHouse/pull/50592) ([Kruglov Pavel](https://github.com/Avogar)).
+* Respect the setting `input_format_as_default` in schema inference. [#50602](https://github.com/ClickHouse/ClickHouse/pull/50602) ([Kruglov Pavel](https://github.com/Avogar)).
+* Allow filter push-down through cross join. [#50605](https://github.com/ClickHouse/ClickHouse/pull/50605) ([Han Fei](https://github.com/hanfei1991)).
+* An up-to-date version of lz4 is now used. [#50621](https://github.com/ClickHouse/ClickHouse/pull/50621) ([Nikita Taranov](https://github.com/nickitat)).
+* Allow skipping trailing empty lines in CSV/TSV/CustomSeparated formats via the settings `input_format_csv_skip_trailing_empty_lines`, `input_format_tsv_skip_trailing_empty_lines` and `input_format_custom_skip_trailing_empty_lines` (disabled by default). Closes [#49315](https://github.com/ClickHouse/ClickHouse/issues/49315). [#50635](https://github.com/ClickHouse/ClickHouse/pull/50635) ([Kruglov Pavel](https://github.com/Avogar)).
+* Functions `toDate[OrDefault|OrNull]()` and `accurateCast[OrDefault|OrNull]()` now correctly parse numeric arguments. [#50709](https://github.com/ClickHouse/ClickHouse/pull/50709) ([Dmitry Kardymon](https://github.com/kardymonds)).
+* The CSV input format can now parse CSV files with whitespace or `\t` as the field delimiter (these delimiters are supported in Spark). [#50712](https://github.com/ClickHouse/ClickHouse/pull/50712) ([KevinyhZou](https://github.com/KevinyhZou)).
+* Settings `number_of_mutations_to_delay` and `number_of_mutations_to_throw` are enabled by default now with values 500 and 1000 respectively. [#50726](https://github.com/ClickHouse/ClickHouse/pull/50726) ([Anton Popov](https://github.com/CurtizJ)).
+* Keeper improvement: add feature flags for Keeper API. Each feature flag can be disabled or enabled by defining it under `keeper_server.feature_flags` config. E.g. to enable `CheckNotExists` request, `keeper_server.feature_flags.check_not_exists` should be set to `1` on Keeper. [#50796](https://github.com/ClickHouse/ClickHouse/pull/50796) ([Antonio Andelic](https://github.com/antonio2368)).
+* The dashboard now correctly shows missing values. This closes [#50831](https://github.com/ClickHouse/ClickHouse/issues/50831). [#50832](https://github.com/ClickHouse/ClickHouse/pull/50832) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* CPU-related cgroup metrics are replaced with a single metric, `CGroupMaxCPU`, for better usability. The `Normalized` CPU usage metrics will be normalized to the cgroup limits instead of the total number of CPUs when the limits are set. This closes [#50836](https://github.com/ClickHouse/ClickHouse/issues/50836). [#50835](https://github.com/ClickHouse/ClickHouse/pull/50835) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Relax the thresholds for "too many parts" to be more modern, and return backpressure during long-running insert queries. [#50856](https://github.com/ClickHouse/ClickHouse/pull/50856) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Added the possibility to use date and time arguments in the syslog timestamp format in the functions `parseDateTimeBestEffort*()` and `parseDateTime64BestEffort*()`. [#50925](https://github.com/ClickHouse/ClickHouse/pull/50925) ([Victor Krasnov](https://github.com/sirvickr)).
+* Suggest using `APPEND` or `TRUNCATE` for `INTO OUTFILE` when the file already exists. [#50950](https://github.com/ClickHouse/ClickHouse/pull/50950) ([alekar](https://github.com/alekar)).
+* Add embedded keeper-client to standalone keeper binary. [#50964](https://github.com/ClickHouse/ClickHouse/pull/50964) ([pufit](https://github.com/pufit)).
+* The command-line parameter `--password` in clickhouse-client can now be specified only once. [#50966](https://github.com/ClickHouse/ClickHouse/pull/50966) ([Alexey Gerasimchuck](https://github.com/Demilivor)).
+* Fix slowness in data lakes caused by synchronous HEAD requests (related to Iceberg/Delta Lake/Hudi being slow with a lot of files). [#50976](https://github.com/ClickHouse/ClickHouse/pull/50976) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Use `hash_of_all_files` from `system.parts` to check identity of parts during on-cluster backups. [#50997](https://github.com/ClickHouse/ClickHouse/pull/50997) ([Vitaly Baranov](https://github.com/vitlibar)).
+* In the system table `system.zookeeper_connection`, the column `connected_time` now identifies the time when the connection was established (in a standard format), and the added column `session_uptime_elapsed_seconds` shows the duration of the established session (in seconds). [#51026](https://github.com/ClickHouse/ClickHouse/pull/51026) ([郭小龙](https://github.com/guoxiaolongzte)).
+* Show halves of checksums in `system.parts`, `system.projection_parts` and in error messages in the correct order. [#51040](https://github.com/ClickHouse/ClickHouse/pull/51040) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Do not replicate `ALTER PARTITION` queries and mutations through `Replicated` database if it has only one shard and the underlying table is `ReplicatedMergeTree`. [#51049](https://github.com/ClickHouse/ClickHouse/pull/51049) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Improve the progress bar for file/s3/hdfs/url table functions by using chunk size from source data and using incremental total size counting in each thread. Fix the progress bar for *Cluster functions. This closes [#47250](https://github.com/ClickHouse/ClickHouse/issues/47250). [#51088](https://github.com/ClickHouse/ClickHouse/pull/51088) ([Kruglov Pavel](https://github.com/Avogar)).
+* Add `total_bytes_to_read` to the Progress packet in the TCP protocol for a better progress bar. [#51158](https://github.com/ClickHouse/ClickHouse/pull/51158) ([Kruglov Pavel](https://github.com/Avogar)).
+* Better checking of data parts on disks with filesystem cache. [#51164](https://github.com/ClickHouse/ClickHouse/pull/51164) ([Anton Popov](https://github.com/CurtizJ)).
+* Disable the cache setting `do_not_evict_index_and_mark_files` (it was enabled in `23.5`). [#51222](https://github.com/ClickHouse/ClickHouse/pull/51222) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix an occasionally incorrect `current_elements_num` in the filesystem cache. [#51242](https://github.com/ClickHouse/ClickHouse/pull/51242) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Add random sleep before merges/mutations execution to split load more evenly between replicas in case of zero-copy replication. [#51282](https://github.com/ClickHouse/ClickHouse/pull/51282) ([alesapin](https://github.com/alesapin)).
+* The function `transform` as well as `CASE` with value matching started to support all data types (see the sketch after this list). This closes [#29730](https://github.com/ClickHouse/ClickHouse/issues/29730). This closes [#32387](https://github.com/ClickHouse/ClickHouse/issues/32387). This closes [#50827](https://github.com/ClickHouse/ClickHouse/issues/50827). This closes [#31336](https://github.com/ClickHouse/ClickHouse/issues/31336). This closes [#40493](https://github.com/ClickHouse/ClickHouse/issues/40493). [#51351](https://github.com/ClickHouse/ClickHouse/pull/51351) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* We have found a bug in LLVM that makes the usage of `compile_expressions` setting unsafe. It is disabled by default. [#51368](https://github.com/ClickHouse/ClickHouse/pull/51368) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Issue [#50220](https://github.com/ClickHouse/ClickHouse/issues/50220) reports a crash in the `grace_hash` join. We finally reproduced the exception locally and found that the issue was caused by a failure to create a temporary file, somehow triggered by https://github.com/ClickHouse/ClickHouse/pull/49816 and https://github.com/ClickHouse/ClickHouse/pull/49483. [#51382](https://github.com/ClickHouse/ClickHouse/pull/51382) ([lgbo](https://github.com/lgbo-ustc)).
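+
+A small sketch of the widened `transform`/`CASE` support mentioned above, here using `Date` values as an example, assuming the new all-types support covers them as the linked issues suggest:
+
+```sql
+-- transform(x, array_from, array_to, default); Date keys were previously rejected
+SELECT transform(d, [toDate('2023-01-01')], ['new year'], 'ordinary day')
+FROM (SELECT toDate('2023-01-02') AS d);
+```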
+
+#### Build/Testing/Packaging Improvement
+* Update contrib/re2 to 2023-06-02. [#50949](https://github.com/ClickHouse/ClickHouse/pull/50949) ([Yuriy Chernyshov](https://github.com/georgthegreat)).
+* ClickHouse server will print the list of changed settings on fatal errors. This closes [#51137](https://github.com/ClickHouse/ClickHouse/issues/51137). [#51138](https://github.com/ClickHouse/ClickHouse/pull/51138) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* In https://github.com/ClickHouse/ClickHouse/pull/51143 the fast tests failed, but the status wasn't created because of a chown `file not found` error. This addresses it. Decrease the default values for `http-max-field-value-size` and `http_max_field_name_size` to 128K. [#51163](https://github.com/ClickHouse/ClickHouse/pull/51163) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Update Ubuntu version in docker containers. [#51180](https://github.com/ClickHouse/ClickHouse/pull/51180) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Allow building ClickHouse with clang-17. [#51300](https://github.com/ClickHouse/ClickHouse/pull/51300) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* [SQLancer](https://github.com/sqlancer/sqlancer) check is considered stable as bugs that were triggered by it are fixed. Now failures of SQLancer check will be reported as failed check status. [#51340](https://github.com/ClickHouse/ClickHouse/pull/51340) ([Ilya Yatsishin](https://github.com/qoega)).
+* Making our CI even better. [#51494](https://github.com/ClickHouse/ClickHouse/pull/51494) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Split the huge `RUN` in the Dockerfile into smaller conditional ones. Install the necessary tools on demand in the same `RUN` layer and remove them afterwards. Upgrade the OS only once at the beginning. Use a modern way to check the signed repository. Downgrade the base image to ubuntu:20.04 to address issues on older Docker versions. Upgrade the Golang version to address Golang vulnerabilities. [#51504](https://github.com/ClickHouse/ClickHouse/pull/51504) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* This is a follow-up for [#51504](https://github.com/ClickHouse/ClickHouse/issues/51504); the cleanup was lost during refactoring. [#51564](https://github.com/ClickHouse/ClickHouse/pull/51564) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+
+#### Bug Fix (user-visible misbehavior in an official stable release)
+
+* Report loading status for executable dictionaries correctly [#48775](https://github.com/ClickHouse/ClickHouse/pull/48775) ([Anton Kozlov](https://github.com/tonickkozlov)).
+* Proper mutation of skip indices and projections [#50104](https://github.com/ClickHouse/ClickHouse/pull/50104) ([Amos Bird](https://github.com/amosbird)).
+* Cleanup moving parts [#50489](https://github.com/ClickHouse/ClickHouse/pull/50489) ([vdimir](https://github.com/vdimir)).
+* Fix backward compatibility for IP types hashing in aggregate functions [#50551](https://github.com/ClickHouse/ClickHouse/pull/50551) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Fix Log family tables returning a wrong row count after truncate [#50585](https://github.com/ClickHouse/ClickHouse/pull/50585) ([flynn](https://github.com/ucasfl)).
+* Fix bug in `uniqExact` parallel merging [#50590](https://github.com/ClickHouse/ClickHouse/pull/50590) ([Nikita Taranov](https://github.com/nickitat)).
+* Revert recent grace hash join changes [#50699](https://github.com/ClickHouse/ClickHouse/pull/50699) ([vdimir](https://github.com/vdimir)).
+* Query Cache: Try to fix bad cast from ColumnConst to ColumnVector [#50704](https://github.com/ClickHouse/ClickHouse/pull/50704) ([Robert Schulze](https://github.com/rschu1ze)).
+* Do not read all the columns from right GLOBAL JOIN table. [#50721](https://github.com/ClickHouse/ClickHouse/pull/50721) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Avoid storing logs in Keeper containing unknown operation [#50751](https://github.com/ClickHouse/ClickHouse/pull/50751) ([Antonio Andelic](https://github.com/antonio2368)).
+* SummingMergeTree support for DateTime64 [#50797](https://github.com/ClickHouse/ClickHouse/pull/50797) ([Jordi Villar](https://github.com/jrdi)).
+* Add compat setting for non-const timezones [#50834](https://github.com/ClickHouse/ClickHouse/pull/50834) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix type of LDAP server params hash in cache entry [#50865](https://github.com/ClickHouse/ClickHouse/pull/50865) ([Julian Maicher](https://github.com/jmaicher)).
+* Fallback to parsing big integer from String instead of exception in Parquet format [#50873](https://github.com/ClickHouse/ClickHouse/pull/50873) ([Kruglov Pavel](https://github.com/Avogar)).
+* Fix checking the lock file too often while writing a backup [#50889](https://github.com/ClickHouse/ClickHouse/pull/50889) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Do not apply projection if read-in-order was enabled. [#50923](https://github.com/ClickHouse/ClickHouse/pull/50923) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix race in Azure Blob Storage iterator [#50936](https://github.com/ClickHouse/ClickHouse/pull/50936) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix erroneous `sort_description` propagation in `CreatingSets` [#50955](https://github.com/ClickHouse/ClickHouse/pull/50955) ([Nikita Taranov](https://github.com/nickitat)).
+* Fix iceberg V2 optional metadata parsing [#50974](https://github.com/ClickHouse/ClickHouse/pull/50974) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* MaterializedMySQL: Keep parentheses for empty table overrides [#50977](https://github.com/ClickHouse/ClickHouse/pull/50977) ([Val Doroshchuk](https://github.com/valbok)).
+* Fix crash in BackupCoordinationStageSync::setError() [#51012](https://github.com/ClickHouse/ClickHouse/pull/51012) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix subtly broken copy-on-write of ColumnLowCardinality dictionary [#51064](https://github.com/ClickHouse/ClickHouse/pull/51064) ([Michael Kolupaev](https://github.com/al13n321)).
+* Generate safe IVs [#51086](https://github.com/ClickHouse/ClickHouse/pull/51086) ([Salvatore Mesoraca](https://github.com/aiven-sal)).
+* Fix ineffective query cache for SELECTs with subqueries [#51132](https://github.com/ClickHouse/ClickHouse/pull/51132) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix Set index with constant nullable comparison. [#51205](https://github.com/ClickHouse/ClickHouse/pull/51205) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Fix a crash in s3 and s3Cluster functions [#51209](https://github.com/ClickHouse/ClickHouse/pull/51209) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Fix core dump when compiling expressions [#51231](https://github.com/ClickHouse/ClickHouse/pull/51231) ([LiuNeng](https://github.com/liuneng1994)).
+* Fix use-after-free in StorageURL when switching URLs [#51260](https://github.com/ClickHouse/ClickHouse/pull/51260) ([Michael Kolupaev](https://github.com/al13n321)).
+* Updated check for parameterized view [#51272](https://github.com/ClickHouse/ClickHouse/pull/51272) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix multiple writing of same file to backup [#51299](https://github.com/ClickHouse/ClickHouse/pull/51299) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Fix fuzzer failure in ActionsDAG [#51301](https://github.com/ClickHouse/ClickHouse/pull/51301) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Remove garbage from function `transform` [#51350](https://github.com/ClickHouse/ClickHouse/pull/51350) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix MSan report in lowerUTF8/upperUTF8 [#51371](https://github.com/ClickHouse/ClickHouse/pull/51371) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* fs cache: fix slightly incorrect use_count after [#44985](https://github.com/ClickHouse/ClickHouse/issues/44985) [#51406](https://github.com/ClickHouse/ClickHouse/pull/51406) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix segfault in MathUnary [#51499](https://github.com/ClickHouse/ClickHouse/pull/51499) ([Ilya Yatsishin](https://github.com/qoega)).
+* Fix logical assert in `tupleElement()` with default values [#51534](https://github.com/ClickHouse/ClickHouse/pull/51534) ([Robert Schulze](https://github.com/rschu1ze)).
+* fs cache: remove file from opened file cache immediately when evicting file [#51596](https://github.com/ClickHouse/ClickHouse/pull/51596) ([Kseniia Sumarokova](https://github.com/kssenii)).
+
+#### NOT FOR CHANGELOG / INSIGNIFICANT
+
+* Deprecate delete-on-destroy.txt [#49181](https://github.com/ClickHouse/ClickHouse/pull/49181) ([Alexander Gololobov](https://github.com/davenger)).
+* Attempt to increase the general runners' survival rate [#49283](https://github.com/ClickHouse/ClickHouse/pull/49283) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Refactor subqueries for IN [#49570](https://github.com/ClickHouse/ClickHouse/pull/49570) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Test plan optimization analyzer [#50095](https://github.com/ClickHouse/ClickHouse/pull/50095) ([Igor Nikonov](https://github.com/devcrafter)).
+* Implement endianness-independent serialization for quantileTiming [#50324](https://github.com/ClickHouse/ClickHouse/pull/50324) ([ltrk2](https://github.com/ltrk2)).
+* Require a `finalize()` call before the destructor for all write buffers [#50395](https://github.com/ClickHouse/ClickHouse/pull/50395) ([Sema Checherinda](https://github.com/CheSema)).
+* Implement big-endian support for the deterministic reservoir sampler [#50405](https://github.com/ClickHouse/ClickHouse/pull/50405) ([ltrk2](https://github.com/ltrk2)).
+* Fix compilation error on big-endian platforms [#50406](https://github.com/ClickHouse/ClickHouse/pull/50406) ([ltrk2](https://github.com/ltrk2)).
+* Attach gdb in stateless tests [#50487](https://github.com/ClickHouse/ClickHouse/pull/50487) ([Kruglov Pavel](https://github.com/Avogar)).
+* JIT infrastructure refactoring [#50531](https://github.com/ClickHouse/ClickHouse/pull/50531) ([Maksim Kita](https://github.com/kitaisreal)).
+* Analyzer: Do not apply Query Tree optimizations on shards [#50584](https://github.com/ClickHouse/ClickHouse/pull/50584) ([Dmitry Novik](https://github.com/novikd)).
+* Increase max array size in group bitmap [#50620](https://github.com/ClickHouse/ClickHouse/pull/50620) ([Kruglov Pavel](https://github.com/Avogar)).
+* Misc Annoy index improvements [#50661](https://github.com/ClickHouse/ClickHouse/pull/50661) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix reading negative decimals in avro format [#50668](https://github.com/ClickHouse/ClickHouse/pull/50668) ([Kruglov Pavel](https://github.com/Avogar)).
+* Unify priorities for connection pools [#50675](https://github.com/ClickHouse/ClickHouse/pull/50675) ([Sergei Trifonov](https://github.com/serxa)).
+* Postpone check of outdated parts [#50676](https://github.com/ClickHouse/ClickHouse/pull/50676) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Unify priorities: `IExecutableTask`s [#50677](https://github.com/ClickHouse/ClickHouse/pull/50677) ([Sergei Trifonov](https://github.com/serxa)).
+* Disable grace_hash join in stress tests [#50693](https://github.com/ClickHouse/ClickHouse/pull/50693) ([vdimir](https://github.com/vdimir)).
+* ReverseTransform small improvement [#50698](https://github.com/ClickHouse/ClickHouse/pull/50698) ([Maksim Kita](https://github.com/kitaisreal)).
+* Support OPTIMIZE for temporary tables [#50710](https://github.com/ClickHouse/ClickHouse/pull/50710) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Refactor reading from object storages [#50711](https://github.com/ClickHouse/ClickHouse/pull/50711) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix data race in log message of cached buffer [#50723](https://github.com/ClickHouse/ClickHouse/pull/50723) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Add new keywords into projections documentation [#50743](https://github.com/ClickHouse/ClickHouse/pull/50743) ([YalalovSM](https://github.com/YalalovSM)).
+* Fix build for aarch64 (temporary disable azure) [#50770](https://github.com/ClickHouse/ClickHouse/pull/50770) ([alesapin](https://github.com/alesapin)).
+* Update version after release [#50772](https://github.com/ClickHouse/ClickHouse/pull/50772) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Update version_date.tsv and changelogs after v23.5.1.3174-stable [#50774](https://github.com/ClickHouse/ClickHouse/pull/50774) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update CHANGELOG.md [#50788](https://github.com/ClickHouse/ClickHouse/pull/50788) ([Ilya Yatsishin](https://github.com/qoega)).
+* Update version_date.tsv and changelogs after v23.2.7.32-stable [#50809](https://github.com/ClickHouse/ClickHouse/pull/50809) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Desctructing --> Destructing [#50810](https://github.com/ClickHouse/ClickHouse/pull/50810) ([Robert Schulze](https://github.com/rschu1ze)).
+* Don't mark a part as broken on `Poco::TimeoutException` [#50811](https://github.com/ClickHouse/ClickHouse/pull/50811) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Rename azure_blob_storage to azureBlobStorage [#50812](https://github.com/ClickHouse/ClickHouse/pull/50812) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Fix ParallelReadBuffer seek [#50820](https://github.com/ClickHouse/ClickHouse/pull/50820) ([Michael Kolupaev](https://github.com/al13n321)).
+* [RFC] Print git hash when crashing [#50823](https://github.com/ClickHouse/ClickHouse/pull/50823) ([Michael Kolupaev](https://github.com/al13n321)).
+* Add tests for function "transform" [#50833](https://github.com/ClickHouse/ClickHouse/pull/50833) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Update version_date.tsv and changelogs after v23.5.2.7-stable [#50844](https://github.com/ClickHouse/ClickHouse/pull/50844) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Updated changelog with azureBlobStorage table function & engine entry [#50850](https://github.com/ClickHouse/ClickHouse/pull/50850) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)).
+* Update easy_tasks_sorted_ru.md [#50853](https://github.com/ClickHouse/ClickHouse/pull/50853) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Document x86 / ARM prerequisites for Docker image [#50867](https://github.com/ClickHouse/ClickHouse/pull/50867) ([Robert Schulze](https://github.com/rschu1ze)).
+* MaterializedMySQL: Add test_named_collections [#50874](https://github.com/ClickHouse/ClickHouse/pull/50874) ([Val Doroshchuk](https://github.com/valbok)).
+* Update version_date.tsv and changelogs after v22.8.18.31-lts [#50881](https://github.com/ClickHouse/ClickHouse/pull/50881) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v23.3.3.52-lts [#50882](https://github.com/ClickHouse/ClickHouse/pull/50882) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v23.4.3.48-stable [#50883](https://github.com/ClickHouse/ClickHouse/pull/50883) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* MaterializedMySQL: Add additional test case to insert_with_modify_binlog_checksum [#50884](https://github.com/ClickHouse/ClickHouse/pull/50884) ([Val Doroshchuk](https://github.com/valbok)).
+* Update broken tests list [#50886](https://github.com/ClickHouse/ClickHouse/pull/50886) ([Dmitry Novik](https://github.com/novikd)).
+* Fix LOGICAL_ERROR in snowflakeToDateTime*() [#50893](https://github.com/ClickHouse/ClickHouse/pull/50893) ([Robert Schulze](https://github.com/rschu1ze)).
+* Tests with parallel replicas are no more "always green" [#50896](https://github.com/ClickHouse/ClickHouse/pull/50896) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Slightly more information in error message about cached disk [#50897](https://github.com/ClickHouse/ClickHouse/pull/50897) ([Michael Kolupaev](https://github.com/al13n321)).
+* do not call finalize after exception [#50907](https://github.com/ClickHouse/ClickHouse/pull/50907) ([Sema Checherinda](https://github.com/CheSema)).
+* Update Annoy docs [#50912](https://github.com/ClickHouse/ClickHouse/pull/50912) ([Robert Schulze](https://github.com/rschu1ze)).
+* A bit safer UserDefinedSQLFunctionVisitor [#50913](https://github.com/ClickHouse/ClickHouse/pull/50913) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update contrib/orc in .gitmodules [#50920](https://github.com/ClickHouse/ClickHouse/pull/50920) ([San](https://github.com/santrancisco)).
+* MaterializedMySQL: Add missing DROP DATABASE for tests [#50924](https://github.com/ClickHouse/ClickHouse/pull/50924) ([Val Doroshchuk](https://github.com/valbok)).
+* Fix 'Illegal column timezone' in stress tests [#50929](https://github.com/ClickHouse/ClickHouse/pull/50929) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix tests sanity checks and avoid dropping system.query_log table [#50934](https://github.com/ClickHouse/ClickHouse/pull/50934) ([Azat Khuzhin](https://github.com/azat)).
+* Fix tests for throttling by allowing more margin of error for trottling event [#50935](https://github.com/ClickHouse/ClickHouse/pull/50935) ([Azat Khuzhin](https://github.com/azat)).
+* 01746_convert_type_with_default: Temporarily disable flaky test [#50937](https://github.com/ClickHouse/ClickHouse/pull/50937) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix the stateless tests image for old commits [#50947](https://github.com/ClickHouse/ClickHouse/pull/50947) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fix logic in `AsynchronousBoundedReadBuffer::seek` [#50952](https://github.com/ClickHouse/ClickHouse/pull/50952) ([Nikita Taranov](https://github.com/nickitat)).
+* Uncomment flaky test (01746_convert_type_with_default) [#50954](https://github.com/ClickHouse/ClickHouse/pull/50954) ([Dmitry Kardymon](https://github.com/kardymonds)).
+* Fix keeper-client help message [#50965](https://github.com/ClickHouse/ClickHouse/pull/50965) ([pufit](https://github.com/pufit)).
+* fix build issue on clang 15 [#50967](https://github.com/ClickHouse/ClickHouse/pull/50967) ([Chang chen](https://github.com/baibaichen)).
+* Docs: Fix embedded video link [#50972](https://github.com/ClickHouse/ClickHouse/pull/50972) ([Robert Schulze](https://github.com/rschu1ze)).
+* Change submodule capnproto to its fork in ClickHouse [#50987](https://github.com/ClickHouse/ClickHouse/pull/50987) ([Kruglov Pavel](https://github.com/Avogar)).
+* Attempt to make 01281_group_by_limit_memory_tracking not flaky [#50995](https://github.com/ClickHouse/ClickHouse/pull/50995) ([Dmitry Novik](https://github.com/novikd)).
+* Fix flaky 02561_null_as_default_more_formats [#51001](https://github.com/ClickHouse/ClickHouse/pull/51001) ([Igor Nikonov](https://github.com/devcrafter)).
+* Fix flaky test_seekable_formats [#51002](https://github.com/ClickHouse/ClickHouse/pull/51002) ([Kruglov Pavel](https://github.com/Avogar)).
+* Follow-up to [#50448](https://github.com/ClickHouse/ClickHouse/issues/50448) [#51006](https://github.com/ClickHouse/ClickHouse/pull/51006) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix a versions' tweak for tagged commits, improve version_helper [#51035](https://github.com/ClickHouse/ClickHouse/pull/51035) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Sqlancer has changed master to main [#51060](https://github.com/ClickHouse/ClickHouse/pull/51060) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Do not spam sqlancer build log [#51061](https://github.com/ClickHouse/ClickHouse/pull/51061) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Refactor IColumn::forEachSubcolumn to make it slightly harder to implement incorrectly [#51072](https://github.com/ClickHouse/ClickHouse/pull/51072) ([Michael Kolupaev](https://github.com/al13n321)).
+* MaterializedMySQL: Rename materialize_with_ddl.py -> materialized_with_ddl [#51074](https://github.com/ClickHouse/ClickHouse/pull/51074) ([Val Doroshchuk](https://github.com/valbok)).
+* Improve woboq browser report [#51077](https://github.com/ClickHouse/ClickHouse/pull/51077) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fix for part_names_mutex used after destruction [#51099](https://github.com/ClickHouse/ClickHouse/pull/51099) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix ColumnConst::forEachSubcolumn missing from previous PR [#51102](https://github.com/ClickHouse/ClickHouse/pull/51102) ([Michael Kolupaev](https://github.com/al13n321)).
+* Fix the test 02783_parsedatetimebesteffort_syslog flakiness [#51112](https://github.com/ClickHouse/ClickHouse/pull/51112) ([Victor Krasnov](https://github.com/sirvickr)).
+* Compatibility with clang-17 [#51114](https://github.com/ClickHouse/ClickHouse/pull/51114) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Make more parallel get requests to ZooKeeper in system.zookeeper [#51118](https://github.com/ClickHouse/ClickHouse/pull/51118) ([Alexander Gololobov](https://github.com/davenger)).
+* Fix 02703_max_local_write_bandwidth flakiness [#51120](https://github.com/ClickHouse/ClickHouse/pull/51120) ([Azat Khuzhin](https://github.com/azat)).
+* Update version_date.tsv and changelogs after v23.5.3.24-stable [#51121](https://github.com/ClickHouse/ClickHouse/pull/51121) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v23.4.4.16-stable [#51122](https://github.com/ClickHouse/ClickHouse/pull/51122) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v23.3.4.17-lts [#51123](https://github.com/ClickHouse/ClickHouse/pull/51123) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v22.8.19.10-lts [#51124](https://github.com/ClickHouse/ClickHouse/pull/51124) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Fix typo [#51126](https://github.com/ClickHouse/ClickHouse/pull/51126) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Slightly better diagnostics [#51127](https://github.com/ClickHouse/ClickHouse/pull/51127) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Small fix in `MergeTreePrefetchedReadPool` [#51131](https://github.com/ClickHouse/ClickHouse/pull/51131) ([Nikita Taranov](https://github.com/nickitat)).
+* Don't report table function accesses to system.errors [#51147](https://github.com/ClickHouse/ClickHouse/pull/51147) ([Raúl Marín](https://github.com/Algunenano)).
+* Fix SQLancer branch name [#51148](https://github.com/ClickHouse/ClickHouse/pull/51148) ([Ilya Yatsishin](https://github.com/qoega)).
+* Revert "Added ability to implicitly use file/hdfs/s3 table functions in clickhouse-local" [#51149](https://github.com/ClickHouse/ClickHouse/pull/51149) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* More profile events for fs cache [#51161](https://github.com/ClickHouse/ClickHouse/pull/51161) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Pass the previously forgotten callback to readBigAt() in ParallelReadBuffer [#51165](https://github.com/ClickHouse/ClickHouse/pull/51165) ([Michael Kolupaev](https://github.com/al13n321)).
+* Update README.md [#51179](https://github.com/ClickHouse/ClickHouse/pull/51179) ([Tyler Hannan](https://github.com/tylerhannan)).
+* Update exception message [#51187](https://github.com/ClickHouse/ClickHouse/pull/51187) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Split long test 02149_schema_inference_formats_with_schema into several tests to avoid timeout in debug [#51197](https://github.com/ClickHouse/ClickHouse/pull/51197) ([Kruglov Pavel](https://github.com/Avogar)).
+* Avoid initializing DateLUT from emptyArray function registration [#51199](https://github.com/ClickHouse/ClickHouse/pull/51199) ([Alexander Gololobov](https://github.com/davenger)).
+* Suppress check for covered parts in ZooKeeper [#51207](https://github.com/ClickHouse/ClickHouse/pull/51207) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* One more profile event for fs cache [#51223](https://github.com/ClickHouse/ClickHouse/pull/51223) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Typo: passowrd_sha256_hex --> password_sha256_hex [#51233](https://github.com/ClickHouse/ClickHouse/pull/51233) ([Robert Schulze](https://github.com/rschu1ze)).
+* Introduce settings enum field with auto-generated values list [#51237](https://github.com/ClickHouse/ClickHouse/pull/51237) ([Sergei Trifonov](https://github.com/serxa)).
+* Drop session if we fail to get Keeper API version [#51238](https://github.com/ClickHouse/ClickHouse/pull/51238) ([Alexander Gololobov](https://github.com/davenger)).
+* Revert "Fix a crash in s3 and s3Cluster functions" [#51239](https://github.com/ClickHouse/ClickHouse/pull/51239) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* fix flaky `AsyncLoader` destructor [#51245](https://github.com/ClickHouse/ClickHouse/pull/51245) ([Sergei Trifonov](https://github.com/serxa)).
+* Docs: little cleanup of configuration-files.md [#51249](https://github.com/ClickHouse/ClickHouse/pull/51249) ([Robert Schulze](https://github.com/rschu1ze)).
+* Fix a stupid bug on Replicated database recovery [#51252](https://github.com/ClickHouse/ClickHouse/pull/51252) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* FileCache: tryReserve() slight improvement [#51259](https://github.com/ClickHouse/ClickHouse/pull/51259) ([Igor Nikonov](https://github.com/devcrafter)).
+* Ugly hotfix for "terminate on uncaught exception" in WriteBufferFromOStream [#51265](https://github.com/ClickHouse/ClickHouse/pull/51265) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Avoid too many calls to Poco::Logger::get [#51266](https://github.com/ClickHouse/ClickHouse/pull/51266) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Update version_date.tsv and changelogs after v23.3.5.9-lts [#51269](https://github.com/ClickHouse/ClickHouse/pull/51269) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Better reporting of broken parts [#51270](https://github.com/ClickHouse/ClickHouse/pull/51270) ([Anton Popov](https://github.com/CurtizJ)).
+* Update ext-dict-functions.md [#51283](https://github.com/ClickHouse/ClickHouse/pull/51283) ([Mike Kot](https://github.com/myrrc)).
+* Disable table structure check for secondary queries from Replicated db [#51284](https://github.com/ClickHouse/ClickHouse/pull/51284) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Define Thrift version for parquet and use correct arrow version [#51285](https://github.com/ClickHouse/ClickHouse/pull/51285) ([Kruglov Pavel](https://github.com/Avogar)).
+* Restore Azure build on ARM [#51288](https://github.com/ClickHouse/ClickHouse/pull/51288) ([Robert Schulze](https://github.com/rschu1ze)).
+* Query Cache: Un-comment settings in server cfg [#51294](https://github.com/ClickHouse/ClickHouse/pull/51294) ([Robert Schulze](https://github.com/rschu1ze)).
+* Require more checks [#51295](https://github.com/ClickHouse/ClickHouse/pull/51295) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix metadata loading test [#51297](https://github.com/ClickHouse/ClickHouse/pull/51297) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Scratch the strange Python code [#51302](https://github.com/ClickHouse/ClickHouse/pull/51302) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add a test for [#47865](https://github.com/ClickHouse/ClickHouse/issues/47865) [#51306](https://github.com/ClickHouse/ClickHouse/pull/51306) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add a test for [#48894](https://github.com/ClickHouse/ClickHouse/issues/48894) [#51307](https://github.com/ClickHouse/ClickHouse/pull/51307) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Add a test for [#48676](https://github.com/ClickHouse/ClickHouse/issues/48676) [#51308](https://github.com/ClickHouse/ClickHouse/pull/51308) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix long test `functions_bad_arguments` [#51310](https://github.com/ClickHouse/ClickHouse/pull/51310) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Unify merge predicate [#51344](https://github.com/ClickHouse/ClickHouse/pull/51344) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix using locks in ProcessList [#51348](https://github.com/ClickHouse/ClickHouse/pull/51348) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Add a test for [#42631](https://github.com/ClickHouse/ClickHouse/issues/42631) [#51353](https://github.com/ClickHouse/ClickHouse/pull/51353) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix performance tests due to warnings from jemalloc about Per-CPU arena disabled [#51362](https://github.com/ClickHouse/ClickHouse/pull/51362) ([Azat Khuzhin](https://github.com/azat)).
+* Fix "merge_truncate_long" test [#51369](https://github.com/ClickHouse/ClickHouse/pull/51369) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Increase timeout of Fast Test [#51372](https://github.com/ClickHouse/ClickHouse/pull/51372) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix bad tests for DNS [#51374](https://github.com/ClickHouse/ClickHouse/pull/51374) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Attempt to fix the `relax_too_many_parts` test [#51375](https://github.com/ClickHouse/ClickHouse/pull/51375) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix MySQL test in Debug mode [#51376](https://github.com/ClickHouse/ClickHouse/pull/51376) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix bad test `01018_Distributed__shard_num` [#51377](https://github.com/ClickHouse/ClickHouse/pull/51377) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix "logical error" in addressToLineWithInlines [#51379](https://github.com/ClickHouse/ClickHouse/pull/51379) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix test 01280_ttl_where_group_by [#51380](https://github.com/ClickHouse/ClickHouse/pull/51380) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Attempt to fix `test_ssl_cert_authentication` [#51384](https://github.com/ClickHouse/ClickHouse/pull/51384) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Revert "Merge pull request [#50951](https://github.com/ClickHouse/ClickHouse/issues/50951) from ZhiguoZh/20230607-toyear-fix" [#51390](https://github.com/ClickHouse/ClickHouse/pull/51390) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Two tests are twice as long on average with Analyzer and sometimes fail [#51391](https://github.com/ClickHouse/ClickHouse/pull/51391) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix 00899_long_attach_memory_limit [#51395](https://github.com/ClickHouse/ClickHouse/pull/51395) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix test 01293_optimize_final_force [#51396](https://github.com/ClickHouse/ClickHouse/pull/51396) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix test 02481_parquet_list_monotonically_increasing_offsets [#51397](https://github.com/ClickHouse/ClickHouse/pull/51397) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix test 02497_trace_events_stress_long [#51398](https://github.com/ClickHouse/ClickHouse/pull/51398) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix broken labeling for `manual approve` [#51405](https://github.com/ClickHouse/ClickHouse/pull/51405) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Fix parts lifetime in `MergeTreeTransaction` [#51407](https://github.com/ClickHouse/ClickHouse/pull/51407) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Fix flaky test test_skip_empty_files [#51409](https://github.com/ClickHouse/ClickHouse/pull/51409) ([Kruglov Pavel](https://github.com/Avogar)).
+* fix flaky test test_profile_events_s3 [#51412](https://github.com/ClickHouse/ClickHouse/pull/51412) ([Sema Checherinda](https://github.com/CheSema)).
+* Update README.md [#51413](https://github.com/ClickHouse/ClickHouse/pull/51413) ([Tyler Hannan](https://github.com/tylerhannan)).
+* Replace try/catch logic in hasTokenOrNull() by something more lightweight [#51425](https://github.com/ClickHouse/ClickHouse/pull/51425) ([Robert Schulze](https://github.com/rschu1ze)).
+* Add retries to `tlsv1_3` tests [#51434](https://github.com/ClickHouse/ClickHouse/pull/51434) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)).
+* Update exception message [#51440](https://github.com/ClickHouse/ClickHouse/pull/51440) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* fs cache: add check for intersecting ranges [#51444](https://github.com/ClickHouse/ClickHouse/pull/51444) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Slightly better code around packets for parallel replicas [#51451](https://github.com/ClickHouse/ClickHouse/pull/51451) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)).
+* Update system_warnings test [#51453](https://github.com/ClickHouse/ClickHouse/pull/51453) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Many fixes [#51455](https://github.com/ClickHouse/ClickHouse/pull/51455) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Fix test 01605_adaptive_granularity_block_borders [#51457](https://github.com/ClickHouse/ClickHouse/pull/51457) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* Try fix flaky 02497_storage_file_reader_selection [#51468](https://github.com/ClickHouse/ClickHouse/pull/51468) ([Kruglov Pavel](https://github.com/Avogar)).
+* Try making Keeper in `DatabaseReplicated` tests more stable [#51473](https://github.com/ClickHouse/ClickHouse/pull/51473) ([Antonio Andelic](https://github.com/antonio2368)).
+* Convert 02003_memory_limit_in_client from expect to sh test (to fix flakiness) [#51475](https://github.com/ClickHouse/ClickHouse/pull/51475) ([Azat Khuzhin](https://github.com/azat)).
+* Fix test_disk_over_web_server [#51476](https://github.com/ClickHouse/ClickHouse/pull/51476) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Delay shutdown of system and temporary databases [#51479](https://github.com/ClickHouse/ClickHouse/pull/51479) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix memory leakage in CompressionCodecDeflateQpl [#51480](https://github.com/ClickHouse/ClickHouse/pull/51480) ([Vitaly Baranov](https://github.com/vitlibar)).
+* Increase retries in test_multiple_disks/test.py::test_start_stop_moves [#51482](https://github.com/ClickHouse/ClickHouse/pull/51482) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix race in BoundedReadBuffer [#51484](https://github.com/ClickHouse/ClickHouse/pull/51484) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix flaky unit test [#51485](https://github.com/ClickHouse/ClickHouse/pull/51485) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix flaky test `test_host_regexp_multiple_ptr_records` [#51506](https://github.com/ClickHouse/ClickHouse/pull/51506) ([Nikolay Degterinsky](https://github.com/evillique)).
+* Add a comment [#51517](https://github.com/ClickHouse/ClickHouse/pull/51517) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Make `test_ssl_cert_authentication` similar to `test_tlvs1_3` [#51520](https://github.com/ClickHouse/ClickHouse/pull/51520) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)).
+* Fix duplicate storage set logical error. [#51521](https://github.com/ClickHouse/ClickHouse/pull/51521) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Update test_storage_postgresql/test.py::test_concurrent_queries [#51523](https://github.com/ClickHouse/ClickHouse/pull/51523) ([Kseniia Sumarokova](https://github.com/kssenii)).
+* Fix FATAL: query context is not detached from thread group [#51540](https://github.com/ClickHouse/ClickHouse/pull/51540) ([Igor Nikonov](https://github.com/devcrafter)).
+* Update version_date.tsv and changelogs after v23.3.6.7-lts [#51548](https://github.com/ClickHouse/ClickHouse/pull/51548) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Decoupled commits from [#51180](https://github.com/ClickHouse/ClickHouse/issues/51180) for backports [#51561](https://github.com/ClickHouse/ClickHouse/pull/51561) ([Mikhail f. Shiryaev](https://github.com/Felixoid)).
+* Try to fix deadlock in ZooKeeper client [#51563](https://github.com/ClickHouse/ClickHouse/pull/51563) ([Alexander Tokmakov](https://github.com/tavplubix)).
+* Retry chroot creation in ZK before stateless tests [#51585](https://github.com/ClickHouse/ClickHouse/pull/51585) ([Antonio Andelic](https://github.com/antonio2368)).
+* use timeout instead of trap in 01443_merge_truncate_long.sh [#51593](https://github.com/ClickHouse/ClickHouse/pull/51593) ([Sema Checherinda](https://github.com/CheSema)).
+* Update version_date.tsv and changelogs after v23.5.4.25-stable [#51604](https://github.com/ClickHouse/ClickHouse/pull/51604) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Fix MergeTreeMarksLoader segfaulting if marks file is longer than expected [#51636](https://github.com/ClickHouse/ClickHouse/pull/51636) ([Michael Kolupaev](https://github.com/al13n321)).
+* Update version_date.tsv and changelogs after v23.4.5.22-stable [#51638](https://github.com/ClickHouse/ClickHouse/pull/51638) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update version_date.tsv and changelogs after v23.3.7.5-lts [#51639](https://github.com/ClickHouse/ClickHouse/pull/51639) ([robot-clickhouse](https://github.com/robot-clickhouse)).
+* Update parts.md [#51643](https://github.com/ClickHouse/ClickHouse/pull/51643) ([Ramazan Polat](https://github.com/ramazanpolat)).
+
diff --git a/docs/en/engines/table-engines/index.md b/docs/en/engines/table-engines/index.md
index d7c582164de..bd704d0e87e 100644
--- a/docs/en/engines/table-engines/index.md
+++ b/docs/en/engines/table-engines/index.md
@@ -53,6 +53,7 @@ Engines in the family:
- [JDBC](../../engines/table-engines/integrations/jdbc.md)
- [MySQL](../../engines/table-engines/integrations/mysql.md)
- [MongoDB](../../engines/table-engines/integrations/mongodb.md)
+- [Redis](../../engines/table-engines/integrations/redis.md)
- [HDFS](../../engines/table-engines/integrations/hdfs.md)
- [S3](../../engines/table-engines/integrations/s3.md)
- [Kafka](../../engines/table-engines/integrations/kafka.md)
diff --git a/docs/en/engines/table-engines/integrations/ExternalDistributed.md b/docs/en/engines/table-engines/integrations/ExternalDistributed.md
index 3fb3fe88b55..d995c34e00a 100644
--- a/docs/en/engines/table-engines/integrations/ExternalDistributed.md
+++ b/docs/en/engines/table-engines/integrations/ExternalDistributed.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/ExternalDistributed
-sidebar_position: 12
+sidebar_position: 55
sidebar_label: ExternalDistributed
title: ExternalDistributed
---
diff --git a/docs/en/engines/table-engines/integrations/azureBlobStorage.md b/docs/en/engines/table-engines/integrations/azureBlobStorage.md
new file mode 100644
index 00000000000..60e448377d0
--- /dev/null
+++ b/docs/en/engines/table-engines/integrations/azureBlobStorage.md
@@ -0,0 +1,52 @@
+---
+slug: /en/engines/table-engines/integrations/azureBlobStorage
+sidebar_position: 10
+sidebar_label: Azure Blob Storage
+---
+
+# AzureBlobStorage Table Engine
+
+This engine provides an integration with the [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs) ecosystem.
+
+## Create Table
+
+``` sql
+CREATE TABLE azure_blob_storage_table (name String, value UInt32)
+ ENGINE = AzureBlobStorage(connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression])
+ [PARTITION BY expr]
+ [SETTINGS ...]
+```
+
+### Engine parameters
+
+- `connection_string|storage_account_url` — A connection string, which includes the account name and key ([create a connection string](https://learn.microsoft.com/en-us/azure/storage/common/storage-configure-connection-string?toc=%2Fazure%2Fstorage%2Fblobs%2Ftoc.json&bc=%2Fazure%2Fstorage%2Fblobs%2Fbreadcrumb%2Ftoc.json#configure-a-connection-string-for-an-azure-storage-account)), or a storage account URL; in the latter case, provide the account name and account key as separate parameters (see `account_name` and `account_key`).
+- `container_name` — Container name.
+- `blobpath` — File path. Supports the following wildcards in read-only mode: `*`, `?`, `{abc,def}` and `{N..M}` where `N`, `M` are numbers and `'abc'`, `'def'` are strings.
+- `account_name` — If `storage_account_url` is used, the account name can be specified here.
+- `account_key` — If `storage_account_url` is used, the account key can be specified here.
+- `format` — The [format](/docs/en/interfaces/formats.md) of the file.
+- `compression` — Supported values: `none`, `gzip/gz`, `brotli/br`, `xz/LZMA`, `zstd/zst`. By default, compression is auto-detected by file extension (same as setting it to `auto`).
+
+**Example**
+
+``` sql
+CREATE TABLE test_table (key UInt64, data String)
+ ENGINE = AzureBlobStorage('DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;BlobEndpoint=http://azurite1:10000/devstoreaccount1/;',
+ 'test_container', 'test_table', 'CSV');
+
+INSERT INTO test_table VALUES (1, 'a'), (2, 'b'), (3, 'c');
+
+SELECT * FROM test_table;
+```
+
+```text
+┌─key─┬─data─┐
+│   1 │ a    │
+│   2 │ b    │
+│   3 │ c    │
+└─────┴──────┘
+```
+
+## See also
+
+[Azure Blob Storage Table Function](/docs/en/sql-reference/table-functions/azureBlobStorage)
diff --git a/docs/en/engines/table-engines/integrations/deltalake.md b/docs/en/engines/table-engines/integrations/deltalake.md
index 3e2e177e28f..b562e9d7fe6 100644
--- a/docs/en/engines/table-engines/integrations/deltalake.md
+++ b/docs/en/engines/table-engines/integrations/deltalake.md
@@ -1,5 +1,6 @@
---
slug: /en/engines/table-engines/integrations/deltalake
+sidebar_position: 40
sidebar_label: DeltaLake
---
diff --git a/docs/en/engines/table-engines/integrations/embedded-rocksdb.md b/docs/en/engines/table-engines/integrations/embedded-rocksdb.md
index a3604b3c332..2de981d33b7 100644
--- a/docs/en/engines/table-engines/integrations/embedded-rocksdb.md
+++ b/docs/en/engines/table-engines/integrations/embedded-rocksdb.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/embedded-rocksdb
-sidebar_position: 9
+sidebar_position: 50
sidebar_label: EmbeddedRocksDB
---
@@ -99,7 +99,7 @@ INSERT INTO test VALUES ('some key', 1, 'value', 3.2);
### Deletes
-Rows can be deleted using `DELETE` query or `TRUNCATE`.
+Rows can be deleted using the `DELETE` query or `TRUNCATE`.
```sql
DELETE FROM test WHERE key LIKE 'some%' AND v1 > 1;
@@ -120,3 +120,93 @@ Values can be updated using the `ALTER TABLE` query. The primary key cannot be u
```sql
ALTER TABLE test UPDATE v1 = v1 * 10 + 2 WHERE key LIKE 'some%' AND v3 > 3.1;
```
+
+### Joins
+
+A special `direct` join with EmbeddedRocksDB tables is supported.
+This direct join avoids forming a hash table in memory and accesses
+the data directly from EmbeddedRocksDB.
+
+With large joins you may see much lower memory usage with direct joins
+because the hash table is not created.
+
+To enable direct joins:
+```sql
+SET join_algorithm = 'direct, hash'
+```
+
+:::tip
+When the `join_algorithm` is set to `direct, hash`, direct joins will be used
+when possible, and hash otherwise.
+:::
+
+#### Example
+
+##### Create and populate an EmbeddedRocksDB table:
+```sql
+CREATE TABLE rdb
+(
+ `key` UInt32,
+ `value` Array(UInt32),
+ `value2` String
+)
+ENGINE = EmbeddedRocksDB
+PRIMARY KEY key
+```
+
+```sql
+INSERT INTO rdb
+ SELECT
+ toUInt32(sipHash64(number) % 10) as key,
+ [key, key+1] as value,
+ ('val2' || toString(key)) as value2
+ FROM numbers_mt(10);
+```
+
+##### Create and populate a table to join with table `rdb`:
+
+```sql
+CREATE TABLE t2
+(
+ `k` UInt16
+)
+ENGINE = TinyLog
+```
+
+```sql
+INSERT INTO t2 SELECT number AS k
+FROM numbers_mt(10)
+```
+
+##### Set the join algorithm to `direct`:
+
+```sql
+SET join_algorithm = 'direct'
+```
+
+##### An INNER JOIN:
+```sql
+SELECT *
+FROM
+(
+ SELECT k AS key
+ FROM t2
+) AS t2
+INNER JOIN rdb ON rdb.key = t2.key
+ORDER BY key ASC
+```
+```response
+┌─key─┬─rdb.key─┬─value──┬─value2─┐
+│ 0 │ 0 │ [0,1] │ val20 │
+│ 2 │ 2 │ [2,3] │ val22 │
+│ 3 │ 3 │ [3,4] │ val23 │
+│ 6 │ 6 │ [6,7] │ val26 │
+│ 7 │ 7 │ [7,8] │ val27 │
+│ 8 │ 8 │ [8,9] │ val28 │
+│ 9 │ 9 │ [9,10] │ val29 │
+└─────┴─────────┴────────┴────────┘
+```
+
+### More information on Joins
+- [`join_algorithm` setting](/docs/en/operations/settings/settings.md#settings-join_algorithm)
+- [JOIN clause](/docs/en/sql-reference/statements/select/join.md)
diff --git a/docs/en/engines/table-engines/integrations/hdfs.md b/docs/en/engines/table-engines/integrations/hdfs.md
index 08cd88826e5..c677123a8d0 100644
--- a/docs/en/engines/table-engines/integrations/hdfs.md
+++ b/docs/en/engines/table-engines/integrations/hdfs.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/hdfs
-sidebar_position: 6
+sidebar_position: 80
sidebar_label: HDFS
---
@@ -63,7 +63,7 @@ SELECT * FROM hdfs_engine_table LIMIT 2
- `ALTER` and `SELECT...SAMPLE` operations.
- Indexes.
- [Zero-copy](../../../operations/storing-data.md#zero-copy) replication is possible, but not recommended.
-
+
:::note Zero-copy replication is not ready for production
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
:::
@@ -233,6 +233,12 @@ libhdfs3 support HDFS namenode HA.
- `_path` — Path to the file.
- `_file` — Name of the file.
+## Storage Settings {#storage-settings}
+
+- [hdfs_truncate_on_insert](/docs/en/operations/settings/settings.md#hdfs-truncate-on-insert) - Allows truncating the file before inserting into it (see the sketch below). Disabled by default.
+- [hdfs_create_multiple_files](/docs/en/operations/settings/settings.md#hdfs_allow_create_multiple_files) - Allows creating a new file on each insert if the format has a suffix. Disabled by default.
+- [hdfs_skip_empty_files](/docs/en/operations/settings/settings.md#hdfs_skip_empty_files) - Allows skipping empty files while reading. Disabled by default.
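+
+A minimal usage sketch for these settings (the namenode address and file path are hypothetical):
+
+```sql
+CREATE TABLE hdfs_table (id UInt32, name String)
+    ENGINE = HDFS('hdfs://hdfs1:9000/data/file.tsv', 'TSV');
+
+-- Overwrite the existing file on insert instead of throwing an error:
+INSERT INTO hdfs_table SETTINGS hdfs_truncate_on_insert = 1 VALUES (1, 'one');
+```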
+
**See Also**
- [Virtual columns](../../../engines/table-engines/index.md#table_engines-virtual_columns)
diff --git a/docs/en/engines/table-engines/integrations/hive.md b/docs/en/engines/table-engines/integrations/hive.md
index 5d10e417ae3..48867394418 100644
--- a/docs/en/engines/table-engines/integrations/hive.md
+++ b/docs/en/engines/table-engines/integrations/hive.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/hive
-sidebar_position: 4
+sidebar_position: 84
sidebar_label: Hive
---
diff --git a/docs/en/engines/table-engines/integrations/hudi.md b/docs/en/engines/table-engines/integrations/hudi.md
index a11e915aa3d..c60618af289 100644
--- a/docs/en/engines/table-engines/integrations/hudi.md
+++ b/docs/en/engines/table-engines/integrations/hudi.md
@@ -1,5 +1,6 @@
---
slug: /en/engines/table-engines/integrations/hudi
+sidebar_position: 86
sidebar_label: Hudi
---
diff --git a/docs/en/engines/table-engines/integrations/iceberg.md b/docs/en/engines/table-engines/integrations/iceberg.md
index 77cefc9283d..9d6395f73ac 100644
--- a/docs/en/engines/table-engines/integrations/iceberg.md
+++ b/docs/en/engines/table-engines/integrations/iceberg.md
@@ -1,5 +1,6 @@
---
slug: /en/engines/table-engines/integrations/iceberg
+sidebar_position: 90
sidebar_label: Iceberg
---
diff --git a/docs/en/engines/table-engines/integrations/index.md b/docs/en/engines/table-engines/integrations/index.md
index b321a644d32..d3b4afc95a2 100644
--- a/docs/en/engines/table-engines/integrations/index.md
+++ b/docs/en/engines/table-engines/integrations/index.md
@@ -6,24 +6,4 @@ sidebar_label: Integrations
# Table Engines for Integrations
-ClickHouse provides various means for integrating with external systems, including table engines. Like with all other table engines, the configuration is done using `CREATE TABLE` or `ALTER TABLE` queries. Then from a user perspective, the configured integration looks like a normal table, but queries to it are proxied to the external system. This transparent querying is one of the key advantages of this approach over alternative integration methods, like dictionaries or table functions, which require to use custom query methods on each use.
-
-List of supported integrations:
-
-- [ODBC](../../../engines/table-engines/integrations/odbc.md)
-- [JDBC](../../../engines/table-engines/integrations/jdbc.md)
-- [MySQL](../../../engines/table-engines/integrations/mysql.md)
-- [MongoDB](../../../engines/table-engines/integrations/mongodb.md)
-- [HDFS](../../../engines/table-engines/integrations/hdfs.md)
-- [S3](../../../engines/table-engines/integrations/s3.md)
-- [Kafka](../../../engines/table-engines/integrations/kafka.md)
-- [EmbeddedRocksDB](../../../engines/table-engines/integrations/embedded-rocksdb.md)
-- [RabbitMQ](../../../engines/table-engines/integrations/rabbitmq.md)
-- [PostgreSQL](../../../engines/table-engines/integrations/postgresql.md)
-- [SQLite](../../../engines/table-engines/integrations/sqlite.md)
-- [Hive](../../../engines/table-engines/integrations/hive.md)
-- [ExternalDistributed](../../../engines/table-engines/integrations/ExternalDistributed.md)
-- [MaterializedPostgreSQL](../../../engines/table-engines/integrations/materialized-postgresql.md)
-- [NATS](../../../engines/table-engines/integrations/nats.md)
-- [DeltaLake](../../../engines/table-engines/integrations/deltalake.md)
-- [Hudi](../../../engines/table-engines/integrations/hudi.md)
+ClickHouse provides various means for integrating with external systems, including table engines. Like with all other table engines, the configuration is done using `CREATE TABLE` or `ALTER TABLE` queries. Then from a user perspective, the configured integration looks like a normal table, but queries to it are proxied to the external system. This transparent querying is one of the key advantages of this approach over alternative integration methods, like dictionaries or table functions, which require the use of custom query methods on each use.
diff --git a/docs/en/engines/table-engines/integrations/jdbc.md b/docs/en/engines/table-engines/integrations/jdbc.md
index 99f851dcf3e..a4a1e2a31ae 100644
--- a/docs/en/engines/table-engines/integrations/jdbc.md
+++ b/docs/en/engines/table-engines/integrations/jdbc.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/jdbc
-sidebar_position: 3
+sidebar_position: 100
sidebar_label: JDBC
---
diff --git a/docs/en/engines/table-engines/integrations/kafka.md b/docs/en/engines/table-engines/integrations/kafka.md
index ccfca4c1f1f..b81d5624c1a 100644
--- a/docs/en/engines/table-engines/integrations/kafka.md
+++ b/docs/en/engines/table-engines/integrations/kafka.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/kafka
-sidebar_position: 8
+sidebar_position: 110
sidebar_label: Kafka
---
diff --git a/docs/en/engines/table-engines/integrations/materialized-postgresql.md b/docs/en/engines/table-engines/integrations/materialized-postgresql.md
index e112ca3bbb1..bccafd67c2c 100644
--- a/docs/en/engines/table-engines/integrations/materialized-postgresql.md
+++ b/docs/en/engines/table-engines/integrations/materialized-postgresql.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/materialized-postgresql
-sidebar_position: 12
+sidebar_position: 130
sidebar_label: MaterializedPostgreSQL
title: MaterializedPostgreSQL
---
diff --git a/docs/en/engines/table-engines/integrations/mongodb.md b/docs/en/engines/table-engines/integrations/mongodb.md
index a647ac9993f..912f81573db 100644
--- a/docs/en/engines/table-engines/integrations/mongodb.md
+++ b/docs/en/engines/table-engines/integrations/mongodb.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/mongodb
-sidebar_position: 5
+sidebar_position: 135
sidebar_label: MongoDB
---
diff --git a/docs/en/engines/table-engines/integrations/mysql.md b/docs/en/engines/table-engines/integrations/mysql.md
index 6ff6221c877..e50ed8caedd 100644
--- a/docs/en/engines/table-engines/integrations/mysql.md
+++ b/docs/en/engines/table-engines/integrations/mysql.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/mysql
-sidebar_position: 4
+sidebar_position: 138
sidebar_label: MySQL
---
@@ -35,6 +35,10 @@ The table structure can differ from the original MySQL table structure:
- Column types may differ from those in the original MySQL table. ClickHouse tries to [cast](../../../engines/database-engines/mysql.md#data_types-support) values to the ClickHouse data types.
- The [external_table_functions_use_nulls](../../../operations/settings/settings.md#external-table-functions-use-nulls) setting defines how to handle Nullable columns. Default value: 1. If 0, the table function does not make Nullable columns and inserts default values instead of nulls. This is also applicable for NULL values inside arrays.
+:::note
+The MySQL table engine is currently not available in the ClickHouse builds for macOS ([issue](https://github.com/ClickHouse/ClickHouse/issues/21191))
+:::
+
**Engine Parameters**
- `host:port` — MySQL server address.
diff --git a/docs/en/engines/table-engines/integrations/nats.md b/docs/en/engines/table-engines/integrations/nats.md
index a82d74e0d95..25f442e5ce7 100644
--- a/docs/en/engines/table-engines/integrations/nats.md
+++ b/docs/en/engines/table-engines/integrations/nats.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/nats
-sidebar_position: 14
+sidebar_position: 140
sidebar_label: NATS
---
@@ -83,12 +83,12 @@ You can select one of the subjects the table reads from and publish your data th
CREATE TABLE queue (
key UInt64,
value UInt64
- ) ENGINE = NATS
+ ) ENGINE = NATS
SETTINGS nats_url = 'localhost:4444',
nats_subjects = 'subject1,subject2',
nats_format = 'JSONEachRow';
- INSERT INTO queue
+ INSERT INTO queue
SETTINGS stream_like_engine_insert_queue = 'subject2'
VALUES (1, 1);
```
@@ -102,7 +102,7 @@ Example:
key UInt64,
value UInt64,
date DateTime
- ) ENGINE = NATS
+ ) ENGINE = NATS
SETTINGS nats_url = 'localhost:4444',
nats_subjects = 'subject1',
nats_format = 'JSONEachRow',
@@ -137,7 +137,7 @@ Example:
CREATE TABLE queue (
key UInt64,
value UInt64
- ) ENGINE = NATS
+ ) ENGINE = NATS
SETTINGS nats_url = 'localhost:4444',
nats_subjects = 'subject1',
nats_format = 'JSONEachRow',
diff --git a/docs/en/engines/table-engines/integrations/odbc.md b/docs/en/engines/table-engines/integrations/odbc.md
index 37e08dc1420..e29e56c10b2 100644
--- a/docs/en/engines/table-engines/integrations/odbc.md
+++ b/docs/en/engines/table-engines/integrations/odbc.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/odbc
-sidebar_position: 2
+sidebar_position: 150
sidebar_label: ODBC
---
diff --git a/docs/en/engines/table-engines/integrations/postgresql.md b/docs/en/engines/table-engines/integrations/postgresql.md
index 51b3048706f..aa3dc855537 100644
--- a/docs/en/engines/table-engines/integrations/postgresql.md
+++ b/docs/en/engines/table-engines/integrations/postgresql.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/postgresql
-sidebar_position: 11
+sidebar_position: 160
sidebar_label: PostgreSQL
---
@@ -136,7 +136,7 @@ postgresql> SELECT * FROM test;
### Creating Table in ClickHouse, and connecting to PostgreSQL table created above
-This example uses the [PostgreSQL table engine](/docs/en/engines/table-engines/integrations/postgresql.md) to connect the ClickHouse table to the PostgreSQL table:
+This example uses the [PostgreSQL table engine](/docs/en/engines/table-engines/integrations/postgresql.md) to connect the ClickHouse table to the PostgreSQL table, and to issue both SELECT and INSERT statements against the PostgreSQL database:
``` sql
CREATE TABLE default.postgresql_table
@@ -150,10 +150,21 @@ ENGINE = PostgreSQL('localhost:5432', 'public', 'test', 'postges_user', 'postgre
### Inserting initial data from PostgreSQL table into ClickHouse table, using a SELECT query
-The [postgresql table function](/docs/en/sql-reference/table-functions/postgresql.md) copies the data from PostgreSQL to ClickHouse, which is often used for improving the query performance of the data by querying or performing analytics in ClickHouse rather than in PostgreSQL, or can also be used for migrating data from PostgreSQL to ClickHouse:
+The [postgresql table function](/docs/en/sql-reference/table-functions/postgresql.md) copies the data from PostgreSQL to ClickHouse. This is often used to improve query performance by querying or performing analytics in ClickHouse rather than in PostgreSQL, and it can also be used for migrating data from PostgreSQL to ClickHouse. Since we will be copying the data from PostgreSQL to ClickHouse, we will use a MergeTree table engine in ClickHouse and call it postgresql_copy:
``` sql
-INSERT INTO default.postgresql_table
+CREATE TABLE default.postgresql_copy
+(
+ `float_nullable` Nullable(Float32),
+ `str` String,
+ `int_id` Int32
+)
+ENGINE = MergeTree
+ORDER BY (int_id);
+```
+
+``` sql
+INSERT INTO default.postgresql_copy
SELECT * FROM postgresql('localhost:5432', 'public', 'test', 'postges_user', 'postgres_password');
```
@@ -164,13 +175,13 @@ If then performing ongoing synchronization between the PostgreSQL table and Clic
This would require keeping track of the max ID or timestamp previously added, such as the following:
``` sql
-SELECT max(`int_id`) AS maxIntID FROM default.postgresql_table;
+SELECT max(`int_id`) AS maxIntID FROM default.postgresql_copy;
```
Then inserting values from PostgreSQL table greater than the max
``` sql
-INSERT INTO default.postgresql_table
+INSERT INTO default.postgresql_copy
SELECT * FROM postgresql('localhost:5432', 'public', 'test', 'postges_user', 'postgres_password');
WHERE int_id > maxIntID;
```
@@ -178,7 +189,7 @@ WHERE int_id > maxIntID;
### Selecting data from the resulting ClickHouse table
``` sql
-SELECT * FROM postgresql_table WHERE str IN ('test');
+SELECT * FROM postgresql_copy WHERE str IN ('test');
```
``` text
diff --git a/docs/en/engines/table-engines/integrations/rabbitmq.md b/docs/en/engines/table-engines/integrations/rabbitmq.md
index 08062278904..3fd5a130173 100644
--- a/docs/en/engines/table-engines/integrations/rabbitmq.md
+++ b/docs/en/engines/table-engines/integrations/rabbitmq.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/rabbitmq
-sidebar_position: 10
+sidebar_position: 170
sidebar_label: RabbitMQ
---
@@ -42,7 +42,6 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
[rabbitmq_queue_consume = false,]
[rabbitmq_address = '',]
[rabbitmq_vhost = '/',]
- [rabbitmq_queue_consume = false,]
[rabbitmq_username = '',]
[rabbitmq_password = '',]
[rabbitmq_commit_on_select = false,]
diff --git a/docs/en/engines/table-engines/integrations/redis.md b/docs/en/engines/table-engines/integrations/redis.md
new file mode 100644
index 00000000000..8086a6503b8
--- /dev/null
+++ b/docs/en/engines/table-engines/integrations/redis.md
@@ -0,0 +1,127 @@
+---
+slug: /en/engines/table-engines/integrations/redis
+sidebar_position: 175
+sidebar_label: Redis
+---
+
+# Redis
+
+This engine allows integrating ClickHouse with [Redis](https://redis.io/). Because Redis uses a key-value model, we strongly recommend querying it only in a point-wise manner, such as `WHERE k = xx` or `WHERE k IN (xx, xx)`.
+
+## Creating a Table {#creating-a-table}
+
+``` sql
+CREATE TABLE [IF NOT EXISTS] [db.]table_name
+(
+ name1 [type1],
+ name2 [type2],
+ ...
+) ENGINE = Redis(host:port[, db_index[, password[, pool_size]]]) PRIMARY KEY(primary_key_name);
+```
+
+**Engine Parameters**
+
+- `host:port` — Redis server address. The port may be omitted, in which case the default Redis port 6379 is used.
+
+- `db_index` — Redis database index, in the range 0 to 15. Default is 0.
+
+- `password` — User password. Default is an empty string.
+
+- `pool_size` — Maximum size of the Redis connection pool. Default is 16.
+
+- `primary_key_name` — any column name from the column list.
+
+- The primary key must be specified and may contain only one column. It is serialized in binary as the Redis key.
+
+- Columns other than the primary key are serialized in binary as the Redis value, in the order they are declared.
+
+- Queries that filter by key equality or with `IN` are optimized into a multi-key lookup in Redis. Queries that do not filter by key result in a full table scan, which is a heavy operation.
+
+## Usage Example {#usage-example}
+
+Create a table in ClickHouse which allows reading data from Redis:
+
+``` sql
+CREATE TABLE redis_table
+(
+ `key` String,
+ `v1` UInt32,
+ `v2` String,
+ `v3` Float32
+)
+ENGINE = Redis('redis1:6379') PRIMARY KEY(key);
+```
+
+Insert:
+
+```sql
+INSERT INTO redis_table Values('1', 1, '1', 1.0), ('2', 2, '2', 2.0);
+```
+
+Query:
+
+``` sql
+SELECT COUNT(*) FROM redis_table;
+```
+
+``` text
+┌─count()─┐
+│ 2 │
+└─────────┘
+```
+
+``` sql
+SELECT * FROM redis_table WHERE key='1';
+```
+
+```text
+┌─key─┬─v1─┬─v2─┬─v3─┐
+│ 1 │ 1 │ 1 │ 1 │
+└─────┴────┴────┴────┘
+```
+
+``` sql
+SELECT * FROM redis_table WHERE v1=2;
+```
+
+```text
+┌─key─┬─v1─┬─v2─┬─v3─┐
+│ 2 │ 2 │ 2 │ 2 │
+└─────┴────┴────┴────┘
+```
+
+Update:
+
+Note that the primary key cannot be updated.
+
+```sql
+ALTER TABLE redis_table UPDATE v1=2 WHERE key='1';
+```
+
+Delete:
+
+```sql
+ALTER TABLE redis_table DELETE WHERE key='1';
+```
+
+Truncate:
+
+`TRUNCATE` flushes the Redis database asynchronously; the SYNC mode is also supported.
+
+```sql
+TRUNCATE TABLE redis_table SYNC;
+```
+
+Join:
+
+Joining with other tables is supported.
+
+```sql
+SELECT * FROM redis_table JOIN merge_tree_table ON merge_tree_table.key=redis_table.key;
+```
+
+## Limitations {#limitations}
+
+Redis engine also supports scanning queries, such as `WHERE k > xx`, but with some limitations (an illustrative query follows the list):
+1. A scanning query may produce duplicated keys in a very rare case when Redis is rehashing. See details in [Redis Scan](https://github.com/redis/redis/blob/e4d183afd33e0b2e6e8d1c79a832f678a04a7886/src/dict.c#L1186-L1269).
+2. Keys could be created and deleted during the scan, so the resulting dataset cannot represent a valid point in time.
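+
+An illustrative scanning query against the `redis_table` from the usage example above, subject to the caveats just listed:
+
+```sql
+-- range scan: works, but is heavy and not a point-in-time snapshot
+SELECT * FROM redis_table WHERE key > '1';
+```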
diff --git a/docs/en/engines/table-engines/integrations/s3.md b/docs/en/engines/table-engines/integrations/s3.md
index f2eaacd92a5..0e2b48ef6a6 100644
--- a/docs/en/engines/table-engines/integrations/s3.md
+++ b/docs/en/engines/table-engines/integrations/s3.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/s3
-sidebar_position: 7
+sidebar_position: 180
sidebar_label: S3
---
@@ -8,30 +8,7 @@ sidebar_label: S3
This engine provides integration with [Amazon S3](https://aws.amazon.com/s3/) ecosystem. This engine is similar to the [HDFS](../../../engines/table-engines/special/file.md#table_engines-hdfs) engine, but provides S3-specific features.
-## Create Table {#creating-a-table}
-
-``` sql
-CREATE TABLE s3_engine_table (name String, value UInt32)
- ENGINE = S3(path [, NOSIGN | aws_access_key_id, aws_secret_access_key,] format, [compression])
- [PARTITION BY expr]
- [SETTINGS ...]
-```
-
-**Engine parameters**
-
-- `path` — Bucket url with path to file. Supports following wildcards in readonly mode: `*`, `?`, `{abc,def}` and `{N..M}` where `N`, `M` — numbers, `'abc'`, `'def'` — strings. For more information see [below](#wildcards-in-path).
-- `NOSIGN` - If this keyword is provided in place of credentials, all the requests will not be signed.
-- `format` — The [format](../../../interfaces/formats.md#formats) of the file.
-- `aws_access_key_id`, `aws_secret_access_key` - Long-term credentials for the [AWS](https://aws.amazon.com/) account user. You can use these to authenticate your requests. Parameter is optional. If credentials are not specified, they are used from the configuration file. For more information see [Using S3 for Data Storage](../mergetree-family/mergetree.md#table_engine-mergetree-s3).
-- `compression` — Compression type. Supported values: `none`, `gzip/gz`, `brotli/br`, `xz/LZMA`, `zstd/zst`. Parameter is optional. By default, it will auto-detect compression by file extension.
-
-### PARTITION BY
-
-`PARTITION BY` — Optional. In most cases you don't need a partition key, and if it is needed you generally don't need a partition key more granular than by month. Partitioning does not speed up queries (in contrast to the ORDER BY expression). You should never use too granular partitioning. Don't partition your data by client identifiers or names (instead, make client identifier or name the first column in the ORDER BY expression).
-
-For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](/docs/en/sql-reference/data-types/date.md). The partition names here have the `"YYYYMM"` format.
-
-**Example**
+## Example
``` sql
CREATE TABLE s3_engine_table (name String, value UInt32)
@@ -49,6 +26,135 @@ SELECT * FROM s3_engine_table LIMIT 2;
│ two │ 2 │
└──────┴───────┘
```
+## Create Table {#creating-a-table}
+
+``` sql
+CREATE TABLE s3_engine_table (name String, value UInt32)
+ ENGINE = S3(path [, NOSIGN | aws_access_key_id, aws_secret_access_key,] format, [compression])
+ [PARTITION BY expr]
+ [SETTINGS ...]
+```
+
+### Engine parameters
+
+- `path` — Bucket URL with a path to the file. Supports the following wildcards in readonly mode: `*`, `?`, `{abc,def}` and `{N..M}` where `N`, `M` — numbers, `'abc'`, `'def'` — strings. For more information see [below](#wildcards-in-path).
+- `NOSIGN` - If this keyword is provided in place of credentials, all the requests will not be signed.
+- `format` — The [format](../../../interfaces/formats.md#formats) of the file.
+- `aws_access_key_id`, `aws_secret_access_key` - Long-term credentials for the [AWS](https://aws.amazon.com/) account user. You can use these to authenticate your requests. The parameter is optional. If credentials are not specified, they are taken from the configuration file. For more information see [Using S3 for Data Storage](../mergetree-family/mergetree.md#table_engine-mergetree-s3).
+- `compression` — Compression type. Supported values: `none`, `gzip/gz`, `brotli/br`, `xz/LZMA`, `zstd/zst`. The parameter is optional. By default, it will auto-detect compression by file extension.
+
+### PARTITION BY
+
+`PARTITION BY` — Optional. In most cases you don't need a partition key, and if it is needed you generally don't need a partition key more granular than by month. Partitioning does not speed up queries (in contrast to the ORDER BY expression). You should never use too granular partitioning. Don't partition your data by client identifiers or names (instead, make client identifier or name the first column in the ORDER BY expression).
+
+For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](/docs/en/sql-reference/data-types/date.md). The partition names here have the `"YYYYMM"` format.
+
+### Querying partitioned data
+
+This example uses the [docker compose recipe](https://github.com/ClickHouse/examples/tree/5fdc6ff72f4e5137e23ea075c88d3f44b0202490/docker-compose-recipes/recipes/ch-and-minio-S3), which integrates ClickHouse and MinIO. You should be able to reproduce the same queries using S3 by replacing the endpoint and authentication values.
+
+Notice that the S3 endpoint in the `ENGINE` configuration uses the parameter token `{_partition_id}` as part of the S3 object (filename), and that the SELECT queries select against those resulting object names (e.g., `test_3.csv`).
+
+:::note
+As shown in the example, querying from S3 tables that are partitioned is
+not directly supported at this time, but can be accomplished by querying the bucket contents with a wildcard.
+
+The primary use-case for writing
+partitioned data in S3 is to enable transferring that data into another
+ClickHouse system (for example, moving from on-prem systems to ClickHouse
+Cloud). Because ClickHouse datasets are often very large, and network
+reliability is sometimes imperfect, it makes sense to transfer datasets
+in subsets, hence partitioned writes.
+:::
+
+#### Create the table
+```sql
+CREATE TABLE p
+(
+ `column1` UInt32,
+ `column2` UInt32,
+ `column3` UInt32
+)
+ENGINE = S3(
+# highlight-next-line
+ 'http://minio:10000/clickhouse//test_{_partition_id}.csv',
+ 'minioadmin',
+ 'minioadminpassword',
+ 'CSV')
+PARTITION BY column3
+```
+
+#### Insert data
+```sql
+INSERT INTO p VALUES (1, 2, 3), (3, 2, 1), (78, 43, 45)
+```
+
+#### Select from partition 3
+
+:::tip
+This query uses the s3 table function
+:::
+
+```sql
+SELECT *
+FROM s3('http://minio:10000/clickhouse//test_3.csv', 'minioadmin', 'minioadminpassword', 'CSV')
+```
+```response
+┌─c1─┬─c2─┬─c3─┐
+│ 1 │ 2 │ 3 │
+└────┴────┴────┘
+```
+
+#### Select from partition 1
+```sql
+SELECT *
+FROM s3('http://minio:10000/clickhouse//test_1.csv', 'minioadmin', 'minioadminpassword', 'CSV')
+```
+```response
+┌─c1─┬─c2─┬─c3─┐
+│ 3 │ 2 │ 1 │
+└────┴────┴────┘
+```
+
+#### Select from partition 45
+```sql
+SELECT *
+FROM s3('http://minio:10000/clickhouse//test_45.csv', 'minioadmin', 'minioadminpassword', 'CSV')
+```
+```response
+┌─c1─┬─c2─┬─c3─┐
+│ 78 │ 43 │ 45 │
+└────┴────┴────┘
+```
+
+#### Select from all partitions
+
+```sql
+SELECT *
+FROM s3('http://minio:10000/clickhouse//**', 'minioadmin', 'minioadminpassword', 'CSV')
+```
+```response
+┌─c1─┬─c2─┬─c3─┐
+│ 3 │ 2 │ 1 │
+└────┴────┴────┘
+┌─c1─┬─c2─┬─c3─┐
+│ 1 │ 2 │ 3 │
+└────┴────┴────┘
+┌─c1─┬─c2─┬─c3─┐
+│ 78 │ 43 │ 45 │
+└────┴────┴────┘
+```
+
+You may naturally try to `SELECT * FROM p`, but as noted above, this query will fail; use the preceding query.
+
+```sql
+SELECT * FROM p
+```
+```response
+Received exception from server (version 23.4.1):
+Code: 48. DB::Exception: Received from localhost:9000. DB::Exception: Reading from a partitioned S3 storage is not implemented yet. (NOT_IMPLEMENTED)
+```
+
## Virtual columns {#virtual-columns}
- `_path` — Path to the file.
@@ -127,6 +233,12 @@ CREATE TABLE table_with_asterisk (name String, value UInt32)
ENGINE = S3('https://clickhouse-public-datasets.s3.amazonaws.com/my-bucket/{some,another}_folder/*', 'CSV');
```
+## Storage Settings {#storage-settings}
+
+- [s3_truncate_on_insert](/docs/en/operations/settings/settings.md#s3-truncate-on-insert) - allows truncating the file before inserting into it (see the sketch below). Disabled by default.
+- [s3_create_multiple_files](/docs/en/operations/settings/settings.md#s3_allow_create_multiple_files) - allows creating a new file on each insert if the format has a suffix. Disabled by default.
+- [s3_skip_empty_files](/docs/en/operations/settings/settings.md#s3_skip_empty_files) - allows skipping empty files while reading. Disabled by default.
+
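+For example, a quick sketch using the `s3_engine_table` from the example above; the setting applies only to this `INSERT`:
+
+```sql
+-- replace the existing object instead of appending to it
+INSERT INTO s3_engine_table SETTINGS s3_truncate_on_insert = 1 VALUES ('one', 1);
+```
+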
## S3-related Settings {#settings}
The following settings can be set before query execution or placed into configuration file.
diff --git a/docs/en/engines/table-engines/integrations/sqlite.md b/docs/en/engines/table-engines/integrations/sqlite.md
index 20597d37a87..c67f863d390 100644
--- a/docs/en/engines/table-engines/integrations/sqlite.md
+++ b/docs/en/engines/table-engines/integrations/sqlite.md
@@ -1,6 +1,6 @@
---
slug: /en/engines/table-engines/integrations/sqlite
-sidebar_position: 7
+sidebar_position: 185
sidebar_label: SQLite
---
diff --git a/docs/en/engines/table-engines/mergetree-family/aggregatingmergetree.md b/docs/en/engines/table-engines/mergetree-family/aggregatingmergetree.md
index 2b8b43802ea..62191d9b5e4 100644
--- a/docs/en/engines/table-engines/mergetree-family/aggregatingmergetree.md
+++ b/docs/en/engines/table-engines/mergetree-family/aggregatingmergetree.md
@@ -109,7 +109,7 @@ INSERT INTO test.visits (StartDate, CounterID, Sign, UserID)
VALUES (1667446031, 1, 6, 3)
```
-The data are inserted in both the table and the materialized view `test.mv_visits`.
+The data is inserted in both the table and the materialized view `test.mv_visits`.
To get the aggregated data, we need to execute a query such as `SELECT ... GROUP BY ...` from the materialized view `test.mv_visits`:
diff --git a/docs/en/engines/table-engines/mergetree-family/annindexes.md b/docs/en/engines/table-engines/mergetree-family/annindexes.md
index 03617a1a709..4a4ebb47bdc 100644
--- a/docs/en/engines/table-engines/mergetree-family/annindexes.md
+++ b/docs/en/engines/table-engines/mergetree-family/annindexes.md
@@ -1,147 +1,211 @@
# Approximate Nearest Neighbor Search Indexes [experimental] {#table_engines-ANNIndex}
-The main task that indexes achieve is to quickly find nearest neighbors for multidimensional data. An example of such a problem can be finding similar pictures (texts) for a given picture (text). That problem can be reduced to finding the nearest [embeddings](https://cloud.google.com/architecture/overview-extracting-and-serving-feature-embeddings-for-machine-learning). They can be created from data using [UDF](/docs/en/sql-reference/functions/index.md/#executable-user-defined-functions).
+Nearest neighbor search is the problem of finding the M closest points to a given point in an N-dimensional vector space. The most
+straightforward approach to solve this problem is a brute-force search in which the distance between the reference point and all points in
+the vector space is computed. This method guarantees perfect accuracy, but it is usually too slow for practical applications. Nearest
+neighbor search problems are therefore often solved with [approximative algorithms](https://github.com/erikbern/ann-benchmarks). Approximative
+nearest neighbor search techniques, in conjunction with [embedding
+methods](https://cloud.google.com/architecture/overview-extracting-and-serving-feature-embeddings-for-machine-learning), allow searching huge
+amounts of media (pictures, songs, articles, etc.) in milliseconds.
-The next queries find the closest neighbors in N-dimensional space using the L2 (Euclidean) distance:
-``` sql
-SELECT *
-FROM table_name
-WHERE L2Distance(Column, Point) < MaxDistance
+Blogs:
+- [Vector Search with ClickHouse - Part 1](https://clickhouse.com/blog/vector-search-clickhouse-p1)
+- [Vector Search with ClickHouse - Part 2](https://clickhouse.com/blog/vector-search-clickhouse-p2)
+
+
+In terms of SQL, the nearest neighbor search problem can be expressed as follows:
+
+``` sql
+SELECT *
+FROM table
+ORDER BY Distance(vectors, Point)
LIMIT N
```
-``` sql
-SELECT *
-FROM table_name
-ORDER BY L2Distance(Column, Point)
+`vectors` contains N-dimensional values of type [Array](../../../sql-reference/data-types/array.md) or
+[Tuple](../../../sql-reference/data-types/tuple.md), for example embeddings. Function `Distance` computes the distance between two vectors.
+Often, the Euclidean (L2) distance is chosen as the distance function, but [other
+distance functions](/docs/en/sql-reference/functions/distance-functions.md) are also possible. `Point` is the reference point, e.g. `(0.17,
+0.33, ...)`, and `N` limits the number of search results.
+
+An alternative formulation of the nearest neighbor search problem looks as follows:
+
+``` sql
+SELECT *
+FROM table
+WHERE Distance(vectors, Point) < MaxDistance
LIMIT N
```
-But it will take some time for execution because of the long calculation of the distance between `TargetEmbedding` and all other vectors. This is where ANN indexes can help. They store a compact approximation of the search space (e.g. using clustering, search trees, etc.) and are able to compute approximate neighbors quickly.
-## Indexes Structure
+While the first query returns the top-`N` closest points to the reference point, the second query returns all points closer to the reference
+point than a maximally allowed radius `MaxDistance`. Parameter `N` limits the number of returned values, which is useful for situations where
+`MaxDistance` is difficult to determine in advance.
-Approximate Nearest Neighbor Search Indexes (`ANNIndexes`) are similar to skip indexes. They are constructed by some granules and determine which of them should be skipped. Compared to skip indices, ANN indices use their results not only to skip some group of granules, but also to select particular granules from a set of granules.
+With brute-force search, both queries are expensive (linear in the number of points) because the distance between all points in `vectors` and
+`Point` must be computed. To speed this process up, Approximate Nearest Neighbor Search Indexes (ANN indexes) store a compact representation
+of the search space (using clustering, search trees, etc.) which allows computing an approximate answer much more quickly (in sub-linear time).
-`ANNIndexes` are designed to speed up two types of queries:
+# Creating and Using ANN Indexes
+
+Syntax to create an ANN index over an [Array](../../../sql-reference/data-types/array.md) column:
+
+```sql
+CREATE TABLE table
+(
+ `id` Int64,
+ `vectors` Array(Float32),
+    INDEX [ann_index_name] vectors TYPE [ann_index_type]([ann_index_parameters]) [GRANULARITY [N]]
+)
+ENGINE = MergeTree
+ORDER BY id;
+```
+
+Syntax to create an ANN index over a [Tuple](../../../sql-reference/data-types/tuple.md) column:
+
+```sql
+CREATE TABLE table
+(
+ `id` Int64,
+ `vectors` Tuple(Float32[, Float32[, ...]]),
+ INDEX [ann_index_name] vectors TYPE [ann_index_type]([ann_index_parameters]) [GRANULARITY [N]]
+)
+ENGINE = MergeTree
+ORDER BY id;
+```
+
+ANN indexes are built during column insertion and merge. As a result, `INSERT` and `OPTIMIZE` statements will be slower than for ordinary
+tables. ANN indexes are ideally used only with immutable or rarely changed data, i.e. when there are far more read requests than write
+requests.
+
+ANN indexes support two types of queries:
+
+- ORDER BY queries:
-- ###### Type 1: Where
- ``` sql
- SELECT *
- FROM table_name
- WHERE DistanceFunction(Column, Point) < MaxDistance
- LIMIT N
- ```
-- ###### Type 2: Order by
``` sql
- SELECT *
- FROM table_name [WHERE ...]
- ORDER BY DistanceFunction(Column, Point)
+ SELECT *
+ FROM table
+ [WHERE ...]
+ ORDER BY Distance(vectors, Point)
LIMIT N
```
-In these queries, `DistanceFunction` is selected from [distance functions](/docs/en/sql-reference/functions/distance-functions.md). `Point` is a known vector (something like `(0.1, 0.1, ... )`). To avoid writing large vectors, use [client parameters](/docs/en//interfaces/cli.md#queries-with-parameters-cli-queries-with-parameters). `Value` - a float value that will bound the neighbourhood.
+- WHERE queries:
-:::note
-ANN index can't speed up query that satisfies both types (`where + order by`, only one of them). All queries must have the limit, as algorithms are used to find nearest neighbors and need a specific number of them.
+ ``` sql
+ SELECT *
+ FROM table
+ WHERE Distance(vectors, Point) < MaxDistance
+ LIMIT N
+ ```
+
+:::tip
+To avoid writing out large vectors, you can use [query
+parameters](/docs/en/interfaces/cli.md#queries-with-parameters-cli-queries-with-parameters), e.g.
+
+```bash
+clickhouse-client --param_vec='[0.1, 0.2, 0.3]' --query="SELECT * FROM table WHERE L2Distance(vectors, {vec: Array(Float32)}) < 1.0"
+```
:::
-:::note
-Indexes are applied only to queries with a limit less than the `max_limit_for_ann_queries` setting. This helps to avoid memory overflows in queries with a large limit. `max_limit_for_ann_queries` setting can be changed if you know you can provide enough memory. The default value is `1000000`.
-:::
+**Restrictions**: Queries that contain both a `WHERE Distance(vectors, Point) < MaxDistance` and an `ORDER BY Distance(vectors, Point)`
+clause cannot use ANN indexes. Also, the approximate algorithms used to determine the nearest neighbors require a limit, hence queries
+without a `LIMIT` clause cannot utilize ANN indexes. Furthermore, ANN indexes are used only if the query has a `LIMIT` value smaller than the
+setting `max_limit_for_ann_queries` (default: 1 million rows). This is a safeguard to prevent large memory allocations by external libraries
+for approximate neighbor search.
-Both types of queries are handled the same way. The indexes get `n` neighbors (where `n` is taken from the `LIMIT` clause) and work with them. In `ORDER BY` query they remember the numbers of all parts of the granule that have at least one of neighbor. In `WHERE` query they remember only those parts that satisfy the requirements.
+**Differences to Skip Indexes**: Similar to regular [skip indexes](https://clickhouse.com/docs/en/optimize/skipping-indexes), ANN indexes are
+constructed over granules and each indexed block consists of `GRANULARITY = [N]`-many granules (`[N]` = 1 by default for normal skip
+indexes). For example, if the primary index granularity of the table is 8192 (setting `index_granularity = 8192`) and `GRANULARITY = 2`,
+then each indexed block will contain 16384 rows. However, data structures and algorithms for approximate neighbor search (usually
+provided by external libraries) are inherently row-oriented. They store a compact representation of a set of rows and also return rows for
+ANN queries. This causes some rather unintuitive differences in the way ANN indexes behave compared to normal skip indexes.
+
+When a user defines an ANN index on a column, ClickHouse internally creates an ANN "sub-index" for each index block. The sub-index is "local"
+in the sense that it only knows about the rows of its containing index block. In the previous example and assuming that a column has 65536
+rows, we obtain four index blocks (spanning eight granules) and an ANN sub-index for each index block. A sub-index is theoretically able to
+return the rows with the N closest points within its index block directly. However, since ClickHouse loads data from disk to memory at the
+granularity of granules, sub-indexes extrapolate matching rows to granule granularity. This is different from regular skip indexes, which
+skip data at the granularity of index blocks.
+
+The `GRANULARITY` parameter determines how many ANN sub-indexes are created. Bigger `GRANULARITY` values mean fewer but larger ANN
+sub-indexes, up to the point where a column (or a column's data part) has only a single sub-index. In that case, the sub-index has a
+"global" view of all column rows and can directly return all granules of the column (part) with relevant rows (there are at most
+`LIMIT [N]`-many such granules). In a second step, ClickHouse will load these granules and identify the actually best rows by performing a
+brute-force distance calculation over all rows of the granules. With a small `GRANULARITY` value, each of the sub-indexes returns up to
+`LIMIT N`-many granules. As a result, more granules need to be loaded and post-filtered. Note that the search accuracy is equally good in
+both cases; only the processing performance differs. It is generally recommended to use a large `GRANULARITY` for ANN indexes and fall
+back to smaller `GRANULARITY` values only in case of problems like excessive memory consumption of the ANN structures. If no `GRANULARITY`
+was specified for ANN indexes, the default value is 100 million.
-## Create table with ANNIndex
+# Available ANN Indexes
-This feature is disabled by default. To enable it, set `allow_experimental_annoy_index` to 1. Also, this feature is disabled on ARM, due to likely problems with the algorithm.
-
-```sql
-CREATE TABLE t
-(
- `id` Int64,
- `data` Tuple(Float32, Float32, Float32),
- INDEX ann_index_name data TYPE ann_index_type(ann_index_parameters) GRANULARITY N
-)
-ENGINE = MergeTree
-ORDER BY id;
-```
-
-```sql
-CREATE TABLE t
-(
- `id` Int64,
- `data` Array(Float32),
- INDEX ann_index_name data TYPE ann_index_type(ann_index_parameters) GRANULARITY N
-)
-ENGINE = MergeTree
-ORDER BY id;
-```
-
-With greater `GRANULARITY` indexes remember the data structure better. The `GRANULARITY` indicates how many granules will be used to construct the index. The more data is provided for the index, the more of it can be handled by one index and the more chances that with the right hyper parameters the index will remember the data structure better. But some indexes can't be built if they don't have enough data, so this granule will always participate in the query. For more information, see the description of indexes.
-
-As the indexes are built only during insertions into table, `INSERT` and `OPTIMIZE` queries are slower than for ordinary table. At this stage indexes remember all the information about the given data. ANNIndexes should be used if you have immutable or rarely changed data and many read requests.
-
-You can create your table with index which uses certain algorithm. Now only indices based on the following algorithms are supported:
-
-# Index list
- [Annoy](/docs/en/engines/table-engines/mergetree-family/annindexes.md#annoy-annoy)
-# Annoy {#annoy}
-Implementation of the algorithm was taken from [this repository](https://github.com/spotify/annoy).
+## Annoy {#annoy}
-Short description of the algorithm:
-The algorithm recursively divides in half all space by random linear surfaces (lines in 2D, planes in 3D etc.). Thus it makes tree of polyhedrons and points that they contains. Repeating the operation several times for greater accuracy it creates a forest.
-To find K Nearest Neighbours it goes down through the trees and fills the buffer of closest points using the priority queue of polyhedrons. Next, it sorts buffer and return the nearest K points.
+Annoy indexes are currently experimental; to use them you first need to `SET allow_experimental_annoy_index = 1`. They are also currently
+disabled on ARM due to memory safety problems with the algorithm.
+
+This type of ANN index implements [the Annoy algorithm](https://github.com/spotify/annoy), which is based on a recursive division of the
+space by random linear surfaces (lines in 2D, planes in 3D, etc.).
+
+
+Syntax to create an Annoy index over an [Array](../../../sql-reference/data-types/array.md) column:
-__Examples__:
```sql
-CREATE TABLE t
+CREATE TABLE table
(
id Int64,
- data Tuple(Float32, Float32, Float32),
- INDEX ann_index_name data TYPE annoy(NumTrees, DistanceName) GRANULARITY N
+ vectors Array(Float32),
+ INDEX [ann_index_name] vectors TYPE annoy([Distance[, NumTrees]]) [GRANULARITY N]
)
ENGINE = MergeTree
ORDER BY id;
```
+Syntax to create an Annoy index over a [Tuple](../../../sql-reference/data-types/tuple.md) column:
+
```sql
-CREATE TABLE t
+CREATE TABLE table
(
id Int64,
- data Array(Float32),
- INDEX ann_index_name data TYPE annoy(NumTrees, DistanceName) GRANULARITY N
+ vectors Tuple(Float32[, Float32[, ...]]),
+ INDEX [ann_index_name] vectors TYPE annoy([Distance[, NumTrees]]) [GRANULARITY N]
)
ENGINE = MergeTree
ORDER BY id;
```
+Annoy currently supports `L2Distance` and `cosineDistance` as distance function `Distance`. If no distance function was specified during
+index creation, `L2Distance` is used as default. Parameter `NumTrees` is the number of trees which the algorithm creates (default if not
+specified: 100). Higher values of `NumTrees` mean more accurate search results but slower index creation / query times (approximately
+linearly) as well as larger index sizes.
+
:::note
-Table with array field will work faster, but all arrays **must** have same length. Use [CONSTRAINT](/docs/en/sql-reference/statements/create/table.md#constraints) to avoid errors. For example, `CONSTRAINT constraint_name_1 CHECK length(data) = 256`.
+Indexes over columns of type `Array` will generally work faster than indexes on `Tuple` columns. All arrays **must** have the same length. Use
+[CONSTRAINT](/docs/en/sql-reference/statements/create/table.md#constraints) to avoid errors. For example, `CONSTRAINT constraint_name_1
+CHECK length(vectors) = 256`.
:::
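+
+A minimal end-to-end sketch; the table name, vector dimension and data are illustrative only:
+
+```sql
+SET allow_experimental_annoy_index = 1;
+
+CREATE TABLE annoy_demo
+(
+    id Int64,
+    vectors Array(Float32),
+    INDEX idx vectors TYPE annoy('L2Distance', 100),
+    CONSTRAINT dim CHECK length(vectors) = 3
+)
+ENGINE = MergeTree
+ORDER BY id;
+
+INSERT INTO annoy_demo VALUES (1, [0.1, 0.2, 0.3]), (2, [0.9, 0.8, 0.7]);
+
+-- approximate nearest neighbor of the reference point
+SELECT id
+FROM annoy_demo
+ORDER BY L2Distance(vectors, [0.11, 0.22, 0.33])
+LIMIT 1;
+```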
-Parameter `NumTrees` is the number of trees which the algorithm will create. The bigger it is, the slower (approximately linear) it works (in both `CREATE` and `SELECT` requests), but the better accuracy you get (adjusted for randomness). By default it is set to `100`. Parameter `DistanceName` is name of distance function. By default it is set to `L2Distance`. It can be set without changing first parameter, for example
+Setting `annoy_index_search_k_nodes` (default: `NumTrees * LIMIT`) determines how many tree nodes are inspected during SELECTs. Larger
+values mean more accurate results at the cost of longer query runtime:
+
```sql
-CREATE TABLE t
-(
- id Int64,
- data Array(Float32),
- INDEX ann_index_name data TYPE annoy('cosineDistance') GRANULARITY N
-)
-ENGINE = MergeTree
-ORDER BY id;
-```
-
-Annoy supports `L2Distance` and `cosineDistance`.
-
-In the `SELECT` in the settings (`ann_index_select_query_params`) you can specify the size of the internal buffer (more details in the description above or in the [original repository](https://github.com/spotify/annoy)). During the query it will inspect up to `search_k` nodes which defaults to `n_trees * n` if not provided. `search_k` gives you a run-time trade-off between better accuracy and speed.
-
-__Example__:
-``` sql
-SELECT *
-FROM table_name [WHERE ...]
-ORDER BY L2Distance(Column, Point)
+SELECT *
+FROM table_name
+ORDER BY L2Distance(vectors, Point)
LIMIT N
-SETTING ann_index_select_query_params=`k_search=100`
+SETTINGS annoy_index_search_k_nodes=100;
```
diff --git a/docs/en/engines/table-engines/mergetree-family/invertedindexes.md b/docs/en/engines/table-engines/mergetree-family/invertedindexes.md
index 31f5a87a2b6..db3d6d0a479 100644
--- a/docs/en/engines/table-engines/mergetree-family/invertedindexes.md
+++ b/docs/en/engines/table-engines/mergetree-family/invertedindexes.md
@@ -15,6 +15,18 @@ tokenized cells of the string column. For example, the string cell "I will be a
" wi", "wil", "ill", "ll ", "l b", " be" etc. The more fine-granular the input strings are tokenized, the bigger but also the more
useful the resulting inverted index will be.
+
:::note
Inverted indexes are experimental and should not be used in production environments yet. They may change in the future in backward-incompatible
ways, for example with respect to their DDL/DQL syntax or performance/compression characteristics.
diff --git a/docs/en/engines/table-engines/mergetree-family/mergetree.md b/docs/en/engines/table-engines/mergetree-family/mergetree.md
index 07f706af91d..67043ef1062 100644
--- a/docs/en/engines/table-engines/mergetree-family/mergetree.md
+++ b/docs/en/engines/table-engines/mergetree-family/mergetree.md
@@ -491,7 +491,7 @@ Syntax: `tokenbf_v1(size_of_bloom_filter_in_bytes, number_of_hash_functions, ran
#### Special-purpose
-- An experimental index to support approximate nearest neighbor (ANN) search. See [here](annindexes.md) for details.
+- Experimental indexes to support approximate nearest neighbor (ANN) search. See [here](annindexes.md) for details.
- An experimental inverted index to support full-text search. See [here](invertedindexes.md) for details.
### Functions Support {#functions-support}
@@ -756,6 +756,17 @@ If you perform the `SELECT` query between merges, you may get expired data. To a
- [ttl_only_drop_parts](/docs/en/operations/settings/settings.md/#ttl_only_drop_parts) setting
+## Disk types
+
+In addition to local block devices, ClickHouse supports these storage types (a query to inspect configured disks follows this list):
+- [`s3` for S3 and MinIO](#table_engine-mergetree-s3)
+- [`gcs` for GCS](/docs/en/integrations/data-ingestion/gcs/index.md/#creating-a-disk)
+- [`blob_storage_disk` for Azure Blob Storage](#table_engine-mergetree-azure-blob-storage)
+- [`hdfs` for HDFS](#hdfs-storage)
+- [`web` for read-only from web](#web-storage)
+- [`cache` for local caching](/docs/en/operations/storing-data.md/#using-local-cache)
+- [`s3_plain` for backups to S3](/docs/en/operations/backup#backuprestore-using-an-s3-disk)
+
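+A quick sketch to inspect the disks a running server has configured (output depends on your configuration):
+
+```sql
+-- list configured disks and their types
+SELECT name, path, type
+FROM system.disks;
+```
+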
## Using Multiple Block Devices for Data Storage {#table_engine-mergetree-multiple-volumes}
### Introduction {#introduction}
@@ -853,7 +864,7 @@ Tags:
- `max_data_part_size_bytes` — the maximum size of a part that can be stored on any of the volume’s disks. If the a size of a merged part estimated to be bigger than `max_data_part_size_bytes` then this part will be written to a next volume. Basically this feature allows to keep new/small parts on a hot (SSD) volume and move them to a cold (HDD) volume when they reach large size. Do not use this setting if your policy has only one volume.
- `move_factor` — when the amount of available space gets lower than this factor, data automatically starts to move on the next volume if any (by default, 0.1). ClickHouse sorts existing parts by size from largest to smallest (in descending order) and selects parts with the total size that is sufficient to meet the `move_factor` condition. If the total size of all parts is insufficient, all parts will be moved.
- `prefer_not_to_merge` — Disables merging of data parts on this volume. When this setting is enabled, merging data on this volume is not allowed. This allows controlling how ClickHouse works with slow disks.
-- `perform_ttl_move_on_insert` — Disables TTL move on data part INSERT. By default if we insert a data part that already expired by the TTL move rule it immediately goes to a volume/disk declared in move rule. This can significantly slowdown insert in case if destination volume/disk is slow (e.g. S3).
+- `perform_ttl_move_on_insert` — Disables TTL move on data part INSERT. By default (if enabled), if we insert a data part that has already expired per the TTL move rule, it immediately goes to the volume/disk declared in the move rule. This can significantly slow down inserts when the destination volume/disk is slow (e.g. S3). If disabled, the already expired data part is written to the default volume and then immediately moved to the TTL volume.
- `load_balancing` - Policy for disk balancing, `round_robin` or `least_used`.
Configuration examples:
@@ -936,7 +947,16 @@ configuration files; all the settings are in the CREATE/ATTACH query.
The example uses `type=web`, but any disk type can be configured as dynamic, even Local disk. Local disks require a path argument to be inside the server config parameter `custom_local_disks_base_directory`, which has no default, so set that also when using local disk.
:::
+#### Example dynamic web storage
+
+:::tip
+A [demo dataset](https://github.com/ClickHouse/web-tables-demo) is hosted on GitHub. To prepare your own tables for web storage, see the tool [clickhouse-static-files-uploader](/docs/en/operations/storing-data.md/#storing-data-on-webserver)
+:::
+
+In this `ATTACH TABLE` query the `UUID` provided matches the directory name of the data, and the endpoint is the URL for the raw GitHub content.
+
```sql
+# highlight-next-line
ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7'
(
price UInt32,
@@ -1138,7 +1158,7 @@ These parameters define the cache layer:
Cache parameters:
- `path` — The path where metadata for the cache is stored.
-- `max_size` — The size (amount of memory) that the cache can grow to.
+- `max_size` — The size (amount of disk space) that the cache can grow to.
:::tip
There are several other cache parameters that you can use to tune your storage, see [using local cache](/docs/en/operations/storing-data.md/#using-local-cache) for the details.
@@ -1238,6 +1258,93 @@ Examples of working configurations can be found in integration tests directory (
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
:::
+## HDFS storage {#hdfs-storage}
+
+In this sample configuration:
+- the disk is of type `hdfs`
+- the data is hosted at `hdfs://hdfs1:9000/clickhouse/`
+
+```xml
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <hdfs>
+                <type>hdfs</type>
+                <endpoint>hdfs://hdfs1:9000/clickhouse/</endpoint>
+                <skip_access_check>true</skip_access_check>
+            </hdfs>
+            <hdd>
+                <type>local</type>
+                <path>/</path>
+            </hdd>
+        </disks>
+        <policies>
+            <hdfs>
+                <volumes>
+                    <main>
+                        <disk>hdfs</disk>
+                    </main>
+                    <external>
+                        <disk>hdd</disk>
+                    </external>
+                </volumes>
+            </hdfs>
+        </policies>
+    </storage_configuration>
+</clickhouse>
+```
+
+## Web storage (read-only) {#web-storage}
+
+Web storage can be used for read-only purposes. An example use is for hosting sample
+data, or for migrating data.
+
+:::tip
+If a web dataset is not expected to be used routinely, storage can instead be configured
+temporarily within a query; see [dynamic storage](#dynamic-storage) and skip editing the
+configuration file.
+:::
+
+In this sample configuration:
+- the disk is of type `web`
+- the data is hosted at `http://nginx:80/test1/`
+- a cache on local storage is used
+
+```xml
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <web>
+                <type>web</type>
+                <endpoint>http://nginx:80/test1/</endpoint>
+            </web>
+            <cached_web>
+                <type>cache</type>
+                <disk>web</disk>
+                <path>cached_web_cache/</path>
+                <max_size>100000000</max_size>
+            </cached_web>
+        </disks>
+        <policies>
+            <web>
+                <volumes>
+                    <main>
+                        <disk>web</disk>
+                    </main>
+                </volumes>
+            </web>
+            <cached_web>
+                <volumes>
+                    <main>
+                        <disk>cached_web</disk>
+                    </main>
+                </volumes>
+            </cached_web>
+        </policies>
+    </storage_configuration>
+</clickhouse>
+```
+
## Virtual Columns {#virtual-columns}
- `_part` — Name of a part.
diff --git a/docs/en/engines/table-engines/special/file.md b/docs/en/engines/table-engines/special/file.md
index 9c4e87487b4..27945b30c03 100644
--- a/docs/en/engines/table-engines/special/file.md
+++ b/docs/en/engines/table-engines/special/file.md
@@ -92,3 +92,11 @@ $ echo -e "1,2\n3,4" | clickhouse-local -q "CREATE TABLE table (a Int64, b Int64
`PARTITION BY` — Optional. It is possible to create separate files by partitioning the data on a partition key. In most cases, you don't need a partition key, and if it is needed you generally don't need a partition key more granular than by month. Partitioning does not speed up queries (in contrast to the ORDER BY expression). You should never use too granular partitioning. Don't partition your data by client identifiers or names (instead, make client identifier or name the first column in the ORDER BY expression).
For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](/docs/en/sql-reference/data-types/date.md). The partition names here have the `"YYYYMM"` format.
+
+## Settings {#settings}
+
+- [engine_file_empty_if_not_exists](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - allows selecting empty data from a file that doesn't exist. Disabled by default.
+- [engine_file_truncate_on_insert](/docs/en/operations/settings/settings.md#engine-file-truncate-on-insert) - allows truncating the file before inserting into it (see the sketch below). Disabled by default.
+- [engine_file_allow_create_multiple_files](/docs/en/operations/settings/settings.md#engine_file_allow_create_multiple_files) - allows creating a new file on each insert if the format has a suffix. Disabled by default.
+- [engine_file_skip_empty_files](/docs/en/operations/settings/settings.md#engine_file_skip_empty_files) - allows skipping empty files while reading. Disabled by default.
+- [storage_file_read_method](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - the method of reading data from the storage file, one of: `read`, `pread`, `mmap`. The mmap method does not apply to clickhouse-server (it's intended for clickhouse-local). Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local.
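+
+For example, a minimal sketch of applying one of these settings per query, assuming a hypothetical two-column `file_engine_table` created with `ENGINE = File(TabSeparated)`:
+
+```sql
+-- overwrite the file contents instead of appending
+INSERT INTO file_engine_table SETTINGS engine_file_truncate_on_insert = 1 VALUES ('one', 1);
+```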
diff --git a/docs/en/engines/table-engines/special/url.md b/docs/en/engines/table-engines/special/url.md
index a4530767e11..26d4975954f 100644
--- a/docs/en/engines/table-engines/special/url.md
+++ b/docs/en/engines/table-engines/special/url.md
@@ -102,3 +102,7 @@ SELECT * FROM url_engine_table
`PARTITION BY` — Optional. It is possible to create separate files by partitioning the data on a partition key. In most cases, you don't need a partition key, and if it is needed you generally don't need a partition key more granular than by month. Partitioning does not speed up queries (in contrast to the ORDER BY expression). You should never use too granular partitioning. Don't partition your data by client identifiers or names (instead, make client identifier or name the first column in the ORDER BY expression).
For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](/docs/en/sql-reference/data-types/date.md). The partition names here have the `"YYYYMM"` format.
+
+## Storage Settings {#storage-settings}
+
+- [engine_url_skip_empty_files](/docs/en/operations/settings/settings.md#engine_url_skip_empty_files) - allows skipping empty files while reading (see the sketch below). Disabled by default.
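+
+For example, a sketch of applying the setting per query, using the `url_engine_table` from the example above:
+
+```sql
+-- return an empty result for empty files instead of throwing an error
+SELECT * FROM url_engine_table SETTINGS engine_url_skip_empty_files = 1;
+```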
diff --git a/docs/en/getting-started/example-datasets/nyc-taxi.md b/docs/en/getting-started/example-datasets/nyc-taxi.md
index 9730faa873c..cac75fdc45a 100644
--- a/docs/en/getting-started/example-datasets/nyc-taxi.md
+++ b/docs/en/getting-started/example-datasets/nyc-taxi.md
@@ -75,7 +75,7 @@ SELECT
payment_type,
pickup_ntaname,
dropoff_ntaname
-FROM s3(
+FROM gcs(
'https://storage.googleapis.com/clickhouse-public-datasets/nyc-taxi/trips_{0..2}.gz',
'TabSeparatedWithNames'
);
diff --git a/docs/en/getting-started/install.md b/docs/en/getting-started/install.md
index d44dc861888..d2e7ab30478 100644
--- a/docs/en/getting-started/install.md
+++ b/docs/en/getting-started/install.md
@@ -378,6 +378,10 @@ request](https://github.com/ClickHouse/ClickHouse/commits/master) and find CI ch
https://s3.amazonaws.com/clickhouse/builds/PRs/.../.../binary_aarch64_v80compat/clickhouse". You can then click the link to download the
build.
+### macOS-only: Install with Homebrew
+
+To install ClickHouse using the popular `brew` package manager, follow the instructions listed in the [ClickHouse Homebrew tap](https://github.com/ClickHouse/homebrew-clickhouse).
+
## Launch {#launch}
To start the server as a daemon, run:
diff --git a/docs/en/interfaces/cli.md b/docs/en/interfaces/cli.md
index f670d464006..8779dd1a544 100644
--- a/docs/en/interfaces/cli.md
+++ b/docs/en/interfaces/cli.md
@@ -194,7 +194,129 @@ You can pass parameters to `clickhouse-client` (all parameters have a default va
- `--print-profile-events` – Print `ProfileEvents` packets.
- `--profile-events-delay-ms` – Delay between printing `ProfileEvents` packets (-1 - print only totals, 0 - print every single packet).
-Since version 20.5, `clickhouse-client` has automatic syntax highlighting (always enabled).
+Instead of the `--host`, `--port`, `--user` and `--password` options, the ClickHouse client also supports connection strings (see the next section).
+
+
+## Connection string {#connection_string}
+
+clickhouse-client alternatively supports connecting to a ClickHouse server using a connection string similar to [MongoDB](https://www.mongodb.com/docs/manual/reference/connection-string/), [PostgreSQL](https://www.postgresql.org/docs/current/libpq-connect.html#LIBPQ-CONNSTRING), [MySQL](https://dev.mysql.com/doc/refman/8.0/en/connecting-using-uri-or-key-value-pairs.html#connecting-using-uri). It has the following syntax:
+
+```text
+clickhouse:[//[user[:password]@][hosts_and_ports]][/database][?query_parameters]
+```
+
+Where
+
+- `user` - (optional) is a user name,
+- `password` - (optional) is a user password. If `:` is specified and the password is blank, the client will prompt for the user's password.
+- `hosts_and_ports` - (optional) is a list of hosts and optional ports `host[:port] [, host[:port]], ...`,
+- `database` - (optional) is the database name,
+- `query_parameters` - (optional) is a list of key-value pairs `param1=value1[&param2=value2], ...`. For some parameters, no value is required. Parameter names and values are case-sensitive.
+
+If no user is specified, the `default` user without a password is used.
+If no host is specified, `localhost` is used.
+If no port is specified, `9000` is used.
+If no database is specified, the `default` database is used.
+
+If the user name, password or database was specified in the connection string, it cannot be specified using `--user`, `--password` or `--database` (and vice versa).
+
+The host component can be either a host name or an IP address. Put an IPv6 address in square brackets to specify it:
+
+```text
+clickhouse://[2001:db8::1234]
+```
+
+A connection string can contain multiple hosts. clickhouse-client will try to connect to these hosts in order (i.e. from left to right). After a connection is established, no attempt is made to connect to the remaining hosts.
+
+The connection string must be specified as the first argument of clickhouse-client. The connection string can be combined with arbitrary other [command-line-options](#command-line-options) except `--host/-h` and `--port`.
+
+The following keys are allowed in the `query_parameters` component:
+
+- `secure` or the shorthand `s` - no value. If specified, the client will connect to the server over a secure connection (TLS). See `secure` in [command-line-options](#command-line-options).
+
+### Percent encoding {#connection_string_uri_percent_encoding}
+
+Non-US-ASCII characters, spaces and special characters in the `user`, `password`, `hosts`, `database` and `query parameters` must be [percent-encoded](https://en.wikipedia.org/wiki/URL_encoding).
+
+### Examples {#connection_string_examples}
+
+Connect to localhost using port 9000 and execute the query `SELECT 1`.
+
+``` bash
+clickhouse-client clickhouse://localhost:9000 --query "SELECT 1"
+```
+
+Connect as user `john` with password `secret` to host `127.0.0.1`, port `9000`.
+
+``` bash
+clickhouse-client clickhouse://john:secret@127.0.0.1:9000
+```
+
+Connect to the host with IPv6 address `[::1]` on port `9000`, using the default user.
+
+``` bash
+clickhouse-client clickhouse://[::1]:9000
+```
+
+Connect to localhost using port 9000 in multiline mode.
+
+``` bash
+clickhouse-client clickhouse://localhost:9000 '-m'
+```
+
+Connect to localhost using port 9000 with the user `default`.
+
+``` bash
+clickhouse-client clickhouse://default@localhost:9000
+
+# equivalent to:
+clickhouse-client clickhouse://localhost:9000 --user default
+```
+
+Connect to localhost using port 9000 to the `my_database` database.
+
+``` bash
+clickhouse-client clickhouse://localhost:9000/my_database
+
+# equivalent to:
+clickhouse-client clickhouse://localhost:9000 --database my_database
+```
+
+Connect to localhost and use the `my_database` database specified in the connection string, over a secure connection enabled by the shorthand `s` URI parameter.
+
+```bash
+clickhouse-client clickhouse://localhost/my_database?s
+
+# equivalent to:
+clickhouse-client clickhouse://localhost/my_database -s
+```
+
+Connect to the default host using the default port, the default user, and the default database.
+
+``` bash
+clickhouse-client clickhouse:
+```
+
+Connect to the default host using the default port, as user `my_user` with no password.
+
+``` bash
+clickhouse-client clickhouse://my_user@
+
+# A blank password between : and @ means the client will prompt for the password before connecting.
+clickhouse-client clickhouse://my_user:@
+```
+
+Connect to localhost using an email address as the user name. The `@` symbol is percent-encoded as `%40`.
+
+``` bash
+clickhouse-client clickhouse://some_user%40some_mail.com@localhost:9000
+```
+
+Connect to one of the provided hosts: `192.168.1.15`, `192.168.1.25`.
+
+``` bash
+clickhouse-client clickhouse://192.168.1.15,192.168.1.25
+```
### Configuration Files {#configuration_files}
diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 2ab9e8caec4..378a1c46d93 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -193,6 +193,7 @@ SELECT * FROM nestedt FORMAT TSV
- [output_format_tsv_crlf_end_of_line](/docs/en/operations/settings/settings-formats.md/#output_format_tsv_crlf_end_of_line) - if it is set true, end of line in TSV output format will be `\r\n` instead of `\n`. Default value - `false`.
- [input_format_tsv_skip_first_lines](/docs/en/operations/settings/settings-formats.md/#input_format_tsv_skip_first_lines) - skip specified number of lines at the beginning of data. Default value - `0`.
- [input_format_tsv_detect_header](/docs/en/operations/settings/settings-formats.md/#input_format_tsv_detect_header) - automatically detect header with names and types in TSV format. Default value - `true`.
+- [input_format_tsv_skip_trailing_empty_lines](/docs/en/operations/settings/settings-formats.md/#input_format_tsv_skip_trailing_empty_lines) - skip trailing empty lines at the end of data. Default value - `false`.
## TabSeparatedRaw {#tabseparatedraw}
@@ -467,6 +468,9 @@ The CSV format supports the output of totals and extremes the same way as `TabSe
- [output_format_csv_crlf_end_of_line](/docs/en/operations/settings/settings-formats.md/#output_format_csv_crlf_end_of_line) - if it is set to true, end of line in CSV output format will be `\r\n` instead of `\n`. Default value - `false`.
- [input_format_csv_skip_first_lines](/docs/en/operations/settings/settings-formats.md/#input_format_csv_skip_first_lines) - skip the specified number of lines at the beginning of data. Default value - `0`.
- [input_format_csv_detect_header](/docs/en/operations/settings/settings-formats.md/#input_format_csv_detect_header) - automatically detect header with names and types in CSV format. Default value - `true`.
+- [input_format_csv_skip_trailing_empty_lines](/docs/en/operations/settings/settings-formats.md/#input_format_csv_skip_trailing_empty_lines) - skip trailing empty lines at the end of data. Default value - `false`.
+- [input_format_csv_trim_whitespaces](/docs/en/operations/settings/settings-formats.md/#input_format_csv_trim_whitespaces) - trim spaces and tabs in non-quoted CSV strings. Default value - `true`.
+- [input_format_csv_allow_whitespace_or_tab_as_delimiter](/docs/en/operations/settings/settings-formats.md/#input_format_csv_allow_whitespace_or_tab_as_delimiter) - Allow to use whitespace or tab as field delimiter in CSV strings. Default value - `false`.
## CSVWithNames {#csvwithnames}
@@ -494,7 +498,9 @@ the types from input data will be compared with the types of the corresponding c
Similar to [Template](#format-template), but it prints or reads all names and types of columns and uses escaping rule from [format_custom_escaping_rule](/docs/en/operations/settings/settings-formats.md/#format_custom_escaping_rule) setting and delimiters from [format_custom_field_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_field_delimiter), [format_custom_row_before_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_row_before_delimiter), [format_custom_row_after_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_row_after_delimiter), [format_custom_row_between_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_row_between_delimiter), [format_custom_result_before_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_result_before_delimiter) and [format_custom_result_after_delimiter](/docs/en/operations/settings/settings-formats.md/#format_custom_result_after_delimiter) settings, not from format strings.
-If setting [input_format_custom_detect_header](/docs/en/operations/settings/settings.md/#input_format_custom_detect_header) is enabled, ClickHouse will automatically detect header with names and types if any.
+If setting [input_format_custom_detect_header](/docs/en/operations/settings/settings-formats.md/#input_format_custom_detect_header) is enabled, ClickHouse will automatically detect header with names and types if any.
+
+If setting [input_format_custom_skip_trailing_empty_lines](/docs/en/operations/settings/settings-formats.md/#input_format_custom_skip_trailing_empty_lines) is enabled, trailing empty lines at the end of the file will be skipped.
There is also `CustomSeparatedIgnoreSpaces` format, which is similar to [TemplateIgnoreSpaces](#templateignorespaces).
@@ -1292,8 +1298,8 @@ For output it uses the following correspondence between ClickHouse types and BSO
| [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `\x04` array |
| [Named Tuple](/docs/en/sql-reference/data-types/tuple.md) | `\x03` document |
| [Map](/docs/en/sql-reference/data-types/map.md) | `\x03` document |
-| [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `\x10` int32 |
-| [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `\x05` binary, `\x00` binary subtype |
+| [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `\x10` int32 |
+| [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `\x05` binary, `\x00` binary subtype |
For input it uses the following correspondence between BSON types and ClickHouse types:
@@ -1303,7 +1309,7 @@ For input it uses the following correspondence between BSON types and ClickHouse
| `\x02` string | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md) |
| `\x03` document | [Map](/docs/en/sql-reference/data-types/map.md)/[Named Tuple](/docs/en/sql-reference/data-types/tuple.md) |
| `\x04` array | [Array](/docs/en/sql-reference/data-types/array.md)/[Tuple](/docs/en/sql-reference/data-types/tuple.md) |
-| `\x05` binary, `\x00` binary subtype | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md)/[IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) |
+| `\x05` binary, `\x00` binary subtype | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md)/[IPv6](/docs/en/sql-reference/data-types/ipv6.md) |
| `\x05` binary, `\x02` old binary subtype | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md) |
| `\x05` binary, `\x03` old uuid subtype | [UUID](/docs/en/sql-reference/data-types/uuid.md) |
| `\x05` binary, `\x04` uuid subtype | [UUID](/docs/en/sql-reference/data-types/uuid.md) |
@@ -1313,7 +1319,7 @@ For input it uses the following correspondence between BSON types and ClickHouse
| `\x0A` null value | [NULL](/docs/en/sql-reference/data-types/nullable.md) |
| `\x0D` JavaScript code | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md) |
| `\x0E` symbol | [String](/docs/en/sql-reference/data-types/string.md)/[FixedString](/docs/en/sql-reference/data-types/fixedstring.md) |
-| `\x10` int32 | [Int32/UInt32](/docs/en/sql-reference/data-types/int-uint.md)/[Decimal32](/docs/en/sql-reference/data-types/decimal.md)/[IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md)/[Enum8/Enum16](/docs/en/sql-reference/data-types/enum.md) |
+| `\x10` int32 | [Int32/UInt32](/docs/en/sql-reference/data-types/int-uint.md)/[Decimal32](/docs/en/sql-reference/data-types/decimal.md)/[IPv4](/docs/en/sql-reference/data-types/ipv4.md)/[Enum8/Enum16](/docs/en/sql-reference/data-types/enum.md) |
| `\x12` int64 | [Int64/UInt64](/docs/en/sql-reference/data-types/int-uint.md)/[Decimal64](/docs/en/sql-reference/data-types/decimal.md)/[DateTime64](/docs/en/sql-reference/data-types/datetime64.md) |
Other BSON types are not supported. Also, it performs conversion between different integer types (for example, you can insert BSON int32 value into ClickHouse UInt8).
@@ -1663,8 +1669,8 @@ The table below shows supported data types and how they match ClickHouse [data t
| `ENUM` | [Enum(8/16)](/docs/en/sql-reference/data-types/enum.md) | `ENUM` |
| `LIST` | [Array](/docs/en/sql-reference/data-types/array.md) | `LIST` |
| `STRUCT` | [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `STRUCT` |
-| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `UINT32` |
-| `DATA` | [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `DATA` |
+| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `UINT32` |
+| `DATA` | [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `DATA` |
| `DATA` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `DATA` |
| `DATA` | [Decimal128/Decimal256](/docs/en/sql-reference/data-types/decimal.md) | `DATA` |
| `STRUCT(entries LIST(STRUCT(key Key, value Value)))` | [Map](/docs/en/sql-reference/data-types/map.md) | `STRUCT(entries LIST(STRUCT(key Key, value Value)))` |
@@ -1866,19 +1872,19 @@ The table below shows supported data types and how they match ClickHouse [data t
| `long (timestamp-millis)` \** | [DateTime64(3)](/docs/en/sql-reference/data-types/datetime.md) | `long (timestamp-millis)` \** |
| `long (timestamp-micros)` \** | [DateTime64(6)](/docs/en/sql-reference/data-types/datetime.md) | `long (timestamp-micros)` \** |
| `bytes (decimal)` \** | [DateTime64(N)](/docs/en/sql-reference/data-types/datetime.md) | `bytes (decimal)` \** |
-| `int` | [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `int` |
-| `fixed(16)` | [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `fixed(16)` |
+| `int` | [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `int` |
+| `fixed(16)` | [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `fixed(16)` |
| `bytes (decimal)` \** | [Decimal(P, S)](/docs/en/sql-reference/data-types/decimal.md) | `bytes (decimal)` \** |
| `string (uuid)` \** | [UUID](/docs/en/sql-reference/data-types/uuid.md) | `string (uuid)` \** |
| `fixed(16)` | [Int128/UInt128](/docs/en/sql-reference/data-types/int-uint.md) | `fixed(16)` |
| `fixed(32)` | [Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `fixed(32)` |
+| `record` | [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `record` |
+
\* `bytes` is default, controlled by [output_format_avro_string_column_pattern](/docs/en/operations/settings/settings-formats.md/#output_format_avro_string_column_pattern)
\** [Avro logical types](https://avro.apache.org/docs/current/spec.html#Logical+Types)
-Unsupported Avro data types: `record` (non-root), `map`
-
Unsupported Avro logical data types: `time-millis`, `time-micros`, `duration`
### Inserting Data {#inserting-data-1}
@@ -1917,7 +1923,26 @@ Output Avro file compression and sync interval can be configured with [output_fo
Using the ClickHouse [DESCRIBE](/docs/en/sql-reference/statements/describe-table) function, you can quickly view the inferred format of an Avro file like the following example. This example includes the URL of a publicly accessible Avro file in the ClickHouse S3 public bucket:
-``` DESCRIBE url('https://clickhouse-public-datasets.s3.eu-central-1.amazonaws.com/hits.avro','Avro');
+```
+DESCRIBE url('https://clickhouse-public-datasets.s3.eu-central-1.amazonaws.com/hits.avro','Avro');
+```
+```
+┌─name───────────────────────┬─type────────────┬─default_type─┬─default_expression─┬─comment─┬─codec_expression─┬─ttl_expression─┐
+│ WatchID │ Int64 │ │ │ │ │ │
+│ JavaEnable │ Int32 │ │ │ │ │ │
+│ Title │ String │ │ │ │ │ │
+│ GoodEvent │ Int32 │ │ │ │ │ │
+│ EventTime │ Int32 │ │ │ │ │ │
+│ EventDate │ Date32 │ │ │ │ │ │
+│ CounterID │ Int32 │ │ │ │ │ │
+│ ClientIP │ Int32 │ │ │ │ │ │
+│ ClientIP6 │ FixedString(16) │ │ │ │ │ │
+│ RegionID │ Int32 │ │ │ │ │ │
+...
+│ IslandID │ FixedString(16) │ │ │ │ │ │
+│ RequestNum │ Int32 │ │ │ │ │ │
+│ RequestTry │ Int32 │ │ │ │ │ │
+└────────────────────────────┴─────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘
```
## AvroConfluent {#data-format-avro-confluent}
@@ -2001,9 +2026,9 @@ The table below shows supported data types and how they match ClickHouse [data t
| `LIST` | [Array](/docs/en/sql-reference/data-types/array.md) | `LIST` |
| `STRUCT` | [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `STRUCT` |
| `MAP` | [Map](/docs/en/sql-reference/data-types/map.md) | `MAP` |
-| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `UINT32` |
-| `FIXED_LENGTH_BYTE_ARRAY`, `BINARY` | [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `FIXED_LENGTH_BYTE_ARRAY` |
-| `FIXED_LENGTH_BYTE_ARRAY`, `BINARY` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `FIXED_LENGTH_BYTE_ARRAY` |
+| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `UINT32` |
+| `FIXED_LENGTH_BYTE_ARRAY`, `BINARY` | [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `FIXED_LENGTH_BYTE_ARRAY` |
+| `FIXED_LENGTH_BYTE_ARRAY`, `BINARY` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `FIXED_LENGTH_BYTE_ARRAY` |
Arrays can be nested and can have a value of the `Nullable` type as an argument. `Tuple` and `Map` types also can be nested.
@@ -2057,7 +2082,7 @@ Special format for reading Parquet file metadata (https://parquet.apache.org/doc
- logical_type - column logical type
- compression - compression used for this column
- total_uncompressed_size - total uncompressed bytes size of the column, calculated as the sum of total_uncompressed_size of the column from all row groups
- - total_compressed_size - total compressed bytes size of the column, calculated as the sum of total_compressed_size of the column from all row groups
+ - total_compressed_size - total compressed bytes size of the column, calculated as the sum of total_compressed_size of the column from all row groups
- space_saved - percent of space saved by compression, calculated as (1 - total_compressed_size/total_uncompressed_size).
- encodings - the list of encodings used for this column
- row_groups - the list of row groups metadata with the next structure:
@@ -2204,9 +2229,9 @@ The table below shows supported data types and how they match ClickHouse [data t
| `LIST` | [Array](/docs/en/sql-reference/data-types/array.md) | `LIST` |
| `STRUCT` | [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `STRUCT` |
| `MAP` | [Map](/docs/en/sql-reference/data-types/map.md) | `MAP` |
-| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `UINT32` |
-| `FIXED_SIZE_BINARY`, `BINARY` | [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `FIXED_SIZE_BINARY` |
-| `FIXED_SIZE_BINARY`, `BINARY` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `FIXED_SIZE_BINARY` |
+| `UINT32` | [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `UINT32` |
+| `FIXED_SIZE_BINARY`, `BINARY` | [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `FIXED_SIZE_BINARY` |
+| `FIXED_SIZE_BINARY`, `BINARY` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `FIXED_SIZE_BINARY` |
Arrays can be nested and can have a value of the `Nullable` type as an argument. `Tuple` and `Map` types also can be nested.
@@ -2272,7 +2297,7 @@ The table below shows supported data types and how they match ClickHouse [data t
| `Struct` | [Tuple](/docs/en/sql-reference/data-types/tuple.md) | `Struct` |
| `Map` | [Map](/docs/en/sql-reference/data-types/map.md) | `Map` |
| `Int` | [IPv4](/docs/en/sql-reference/data-types/int-uint.md) | `Int` |
-| `Binary` | [IPv6](/docs/en/sql-reference/data-types/domains/ipv6.md) | `Binary` |
+| `Binary` | [IPv6](/docs/en/sql-reference/data-types/ipv6.md) | `Binary` |
| `Binary` | [Int128/UInt128/Int256/UInt256](/docs/en/sql-reference/data-types/int-uint.md) | `Binary` |
| `Binary` | [Decimal256](/docs/en/sql-reference/data-types/decimal.md) | `Binary` |
@@ -2429,18 +2454,22 @@ In this format, all input data is read to a single value. It is possible to pars
The result is output in binary format without delimiters and escaping. If more than one value is output, the format is ambiguous, and it will be impossible to read the data back.
Below is a comparison of the formats `RawBLOB` and [TabSeparatedRaw](#tabseparatedraw).
+
`RawBLOB`:
- data is output in binary format, no escaping;
- there are no delimiters between values;
- no newline at the end of each value.
-[TabSeparatedRaw] (#tabseparatedraw):
+
+`TabSeparatedRaw`:
- data is output without escaping;
- the rows contain values separated by tabs;
- there is a line feed after the last value in every row.
The following is a comparison of the `RawBLOB` and [RowBinary](#rowbinary) formats.
+
`RawBLOB`:
- String fields are output without being prefixed by length.
+
`RowBinary`:
- String fields are represented as length in varint format (unsigned [LEB128] (https://en.wikipedia.org/wiki/LEB128)), followed by the bytes of the string.
@@ -2485,7 +2514,7 @@ ClickHouse supports reading and writing [MessagePack](https://msgpack.org/) data
| `uint 64` | [DateTime64](/docs/en/sql-reference/data-types/datetime.md) | `uint 64` |
| `fixarray`, `array 16`, `array 32` | [Array](/docs/en/sql-reference/data-types/array.md)/[Tuple](/docs/en/sql-reference/data-types/tuple.md) | `fixarray`, `array 16`, `array 32` |
| `fixmap`, `map 16`, `map 32` | [Map](/docs/en/sql-reference/data-types/map.md) | `fixmap`, `map 16`, `map 32` |
-| `uint 32` | [IPv4](/docs/en/sql-reference/data-types/domains/ipv4.md) | `uint 32` |
+| `uint 32` | [IPv4](/docs/en/sql-reference/data-types/ipv4.md) | `uint 32` |
| `bin 8` | [String](/docs/en/sql-reference/data-types/string.md) | `bin 8` |
| `int 8` | [Enum8](/docs/en/sql-reference/data-types/enum.md) | `int 8` |
| `bin 8` | [(U)Int128/(U)Int256](/docs/en/sql-reference/data-types/int-uint.md) | `bin 8` |
diff --git a/docs/en/interfaces/schema-inference.md b/docs/en/interfaces/schema-inference.md
index c448d0aee47..a4c7eb61e50 100644
--- a/docs/en/interfaces/schema-inference.md
+++ b/docs/en/interfaces/schema-inference.md
@@ -329,8 +329,8 @@ SELECT count() FROM system.schema_inference_cache WHERE storage='S3'
## Text formats {#text-formats}
For text formats, ClickHouse reads the data row by row, extracts column values according to the format,
-and then uses some recursive parsers and heuristics to determine the type for each value. The maximum number of rows read from the data in schema inference
-is controlled by the setting `input_format_max_rows_to_read_for_schema_inference` with default value 25000.
+and then uses some recursive parsers and heuristics to determine the type for each value. The maximum number of rows and bytes read from the data in schema inference
+is controlled by the settings `input_format_max_rows_to_read_for_schema_inference` (25000 by default) and `input_format_max_bytes_to_read_for_schema_inference` (32 Mb by default).
By default, all inferred types are [Nullable](../sql-reference/data-types/nullable.md), but you can change this by setting `schema_inference_make_columns_nullable` (see examples in the [settings](#settings-for-text-formats) section).
### JSON formats {#json-formats}
@@ -1144,13 +1144,15 @@ Line: value_1=2, value_2="Some string 2", value_3="[4, 5, NULL]"$$)
### Settings for text formats {#settings-for-text-formats}
-#### input_format_max_rows_to_read_for_schema_inference
+#### input_format_max_rows_to_read_for_schema_inference/input_format_max_bytes_to_read_for_schema_inference
-This setting controls the maximum number of rows to be read while schema inference.
-The more rows are read, the more time is spent on schema inference, but the greater the chance to
+These settings control the amount of data to be read while schema inference.
+The more rows/bytes are read, the more time is spent on schema inference, but the greater the chance to
correctly determine the types (especially when the data contains a lot of nulls).
-Default value: `25000`.
+Default values:
+- `25000` for `input_format_max_rows_to_read_for_schema_inference`.
+- `33554432` (32 Mb) for `input_format_max_bytes_to_read_for_schema_inference`.
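+
+For example, both limits can be lowered to make schema inference on large inputs cheaper (an illustrative sketch; `data.jsonl` is a hypothetical file):
+
+``` bash
+./clickhouse local -q "DESC file('data.jsonl') SETTINGS input_format_max_rows_to_read_for_schema_inference = 100, input_format_max_bytes_to_read_for_schema_inference = 1048576"
+```
+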
#### column_names_for_schema_inference
@@ -1192,7 +1194,7 @@ DESC format(JSONEachRow, '{"id" : 1, "age" : 25, "name" : "Josh", "status" : nul
#### schema_inference_make_columns_nullable
Controls making inferred types `Nullable` in schema inference for formats without information about nullability.
-If the setting is enabled, all inferred type will be `Nullable`, if disabled, the inferred type will be `Nullable` only if the column contains `NULL` in a sample that is parsed during schema inference.
+If the setting is enabled, all inferred types will be `Nullable`; if disabled, the inferred type will be `Nullable` only if `input_format_null_as_default` is disabled and the column contains `NULL` in a sample that is parsed during schema inference.
Enabled by default.
@@ -1215,7 +1217,8 @@ DESC format(JSONEachRow, $$
└─────────┴─────────────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘
```
```sql
-SET schema_inference_make_columns_nullable = 0
+SET schema_inference_make_columns_nullable = 0;
+SET input_format_null_as_default = 0;
DESC format(JSONEachRow, $$
{"id" : 1, "age" : 25, "name" : "Josh", "status" : null, "hobbies" : ["football", "cooking"]}
{"id" : 2, "age" : 19, "name" : "Alan", "status" : "married", "hobbies" : ["tennis", "art"]}
@@ -1232,6 +1235,25 @@ DESC format(JSONEachRow, $$
└─────────┴──────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘
```
+```sql
+SET schema_inference_make_columns_nullable = 0;
+SET input_format_null_as_default = 1;
+DESC format(JSONEachRow, $$
+ {"id" : 1, "age" : 25, "name" : "Josh", "status" : null, "hobbies" : ["football", "cooking"]}
+ {"id" : 2, "age" : 19, "name" : "Alan", "status" : "married", "hobbies" : ["tennis", "art"]}
+ $$)
+```
+```response
+
+┌─name────┬─type──────────┬─default_type─┬─default_expression─┬─comment─┬─codec_expression─┬─ttl_expression─┐
+│ id │ Int64 │ │ │ │ │ │
+│ age │ Int64 │ │ │ │ │ │
+│ name │ String │ │ │ │ │ │
+│ status │ String │ │ │ │ │ │
+│ hobbies │ Array(String) │ │ │ │ │ │
+└─────────┴───────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘
+```
+
#### input_format_try_infer_integers
If enabled, ClickHouse will try to infer integers instead of floats in schema inference for text formats.
@@ -1623,7 +1645,7 @@ In schema inference for CapnProto format ClickHouse uses the following type matc
## Strong-typed binary formats {#strong-typed-binary-formats}
In such formats, each serialized value contains information about its type (and possibly about its name), but there is no information about the whole table.
-In schema inference for such formats, ClickHouse reads data row by row (up to `input_format_max_rows_to_read_for_schema_inference` rows) and extracts
+In schema inference for such formats, ClickHouse reads data row by row (up to `input_format_max_rows_to_read_for_schema_inference` rows or `input_format_max_bytes_to_read_for_schema_inference` bytes) and extracts
the type (and possibly name) for each value from the data and then converts these types to ClickHouse types.
### MsgPack {#msgpack}
diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md
index 6da61833c12..c3ddee07d0b 100644
--- a/docs/en/operations/backup.md
+++ b/docs/en/operations/backup.md
@@ -83,6 +83,7 @@ The BACKUP and RESTORE statements take a list of DATABASE and TABLE names, a des
- [`compression_method`](/docs/en/sql-reference/statements/create/table.md/#column-compression-codecs) and compression_level
- `password` for the file on disk
- `base_backup`: the destination of the previous backup of this source. For example, `Disk('backups', '1.zip')`
+ - `structure_only`: if enabled, allows backing up or restoring only the CREATE statements, without the data of tables (see the sketch below)
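+
+A minimal sketch of passing `structure_only` via clickhouse-client (hypothetical table and destination; the setting is passed like the other backup settings):
+
+``` bash
+clickhouse-client --query "BACKUP TABLE test.table TO Disk('backups', 'schema_only.zip') SETTINGS structure_only = 1"
+```
+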
### Usage examples
@@ -398,4 +399,4 @@ To disallow concurrent backup/restore, you can use these settings respectively.
```
The default value for both is true, so by default concurrent backup/restores are allowed.
-When these settings are false on a cluster, only 1 backup/restore is allowed to run on a cluster at a time.
\ No newline at end of file
+When these settings are false on a cluster, only 1 backup/restore is allowed to run on a cluster at a time.
diff --git a/docs/en/operations/configuration-files.md b/docs/en/operations/configuration-files.md
index b3583e156ad..d3e21cb2364 100644
--- a/docs/en/operations/configuration-files.md
+++ b/docs/en/operations/configuration-files.md
@@ -6,32 +6,43 @@ sidebar_label: Configuration Files
# Configuration Files
-ClickHouse supports multi-file configuration management. The main server configuration file is `/etc/clickhouse-server/config.xml` or `/etc/clickhouse-server/config.yaml`. Other files must be in the `/etc/clickhouse-server/config.d` directory. Note, that any configuration file can be written either in XML or YAML, but mixing formats in one file is not supported. For example, you can have main configs as `config.xml` and `users.xml` and write additional files in `config.d` and `users.d` directories in `.yaml`.
+The ClickHouse server can be configured with configuration files in XML or YAML syntax. In most installation types, the ClickHouse server runs with `/etc/clickhouse-server/config.xml` as its default configuration file, but the location of the configuration file can also be specified manually at server startup with the command-line option `--config-file=` or `-C`. Additional configuration files may be placed into a directory `config.d/` relative to the main configuration file, for example into `/etc/clickhouse-server/config.d/`. Files in this directory and the main configuration file are merged in a preprocessing step before the configuration is applied in the ClickHouse server. Configuration files are merged in alphabetical order. To simplify updates and improve modularization, it is best practice to keep the default `config.xml` file unmodified and to place additional customization into `config.d/`.
-All XML files should have the same root element, usually `<clickhouse>`. As for YAML, `clickhouse:` should not be present, the parser will insert it automatically.
+It is possible to mix XML and YAML configuration files, for example you could have a main configuration file `config.xml` and additional configuration files `config.d/network.xml`, `config.d/timezone.yaml` and `config.d/keeper.yaml`. Mixing XML and YAML within a single configuration file is not supported. XML configuration files should use `<clickhouse>...</clickhouse>` as the top-level tag. In YAML configuration files, `clickhouse:` is optional; the parser inserts it implicitly if absent.
-## Override {#override}
+## Overriding Configuration {#override}
-Some settings specified in the main configuration file can be overridden in other configuration files:
+Merging configuration files behaves as one intuitively expects: the contents of both files are combined recursively, and children with the same name are replaced by the element of the more specific configuration file. The merge can be customized using the attributes `replace` and `remove`.
+- Attribute `replace` means that the element is replaced by the specified one.
+- Attribute `remove` means that the element is deleted.
-- The `replace` or `remove` attributes can be specified for the elements of these configuration files.
-- If neither is specified, it combines the contents of elements recursively, replacing values of duplicate children.
-- If `replace` is specified, it replaces the entire element with the specified one.
-- If `remove` is specified, it deletes the element.
+To specify that a value of an element should be replaced by the value of an environment variable, you can use attribute `from_env`.
-You can also declare attributes as coming from environment variables by using `from_env="VARIABLE_NAME"`:
+Example with `$MAX_QUERY_SIZE = 150000`:
```xml
-<users>
-    <default>
-        <password from_env="ENV_VAR_NAME"/>
-    </default>
-</users>
+<clickhouse>
+    <profiles>
+        <default>
+            <max_query_size from_env="MAX_QUERY_SIZE"/>
+        </default>
+    </profiles>
+</clickhouse>
```
-## Substitution {#substitution}
+which is equal to
+
+``` xml
+<clickhouse>
+    <profiles>
+        <default>
+            <max_query_size>150000</max_query_size>
+        </default>
+    </profiles>
+</clickhouse>
+```
+
+## Substituting Configuration {#substitution}
The config can also define “substitutions”. If an element has the `incl` attribute, the corresponding substitution from the file will be used as the value. By default, the path to the file with substitutions is `/etc/metrika.xml`. This can be changed in the [include_from](../operations/server-configuration-parameters/settings.md#server_configuration_parameters-include_from) element in the server config. The substitution values are specified in `/clickhouse/substitution_name` elements in this file. If a substitution specified in `incl` does not exist, it is recorded in the log. To prevent ClickHouse from logging missing substitutions, specify the `optional="true"` attribute (for example, settings for [macros](../operations/server-configuration-parameters/settings.md#macros)).
diff --git a/docs/en/operations/named-collections.md b/docs/en/operations/named-collections.md
index a521a369721..02f52b6f8bf 100644
--- a/docs/en/operations/named-collections.md
+++ b/docs/en/operations/named-collections.md
@@ -50,7 +50,7 @@ To manage named collections with DDL a user must have the `named_control_collect
```
:::tip
-In the above example the `passowrd_sha256_hex` value is the hexadecimal representation of the SHA256 hash of the password. This configuration for the user `default` has the attribute `replace=true` as in the default configuration has a plain text `password` set, and it is not possible to have both plain text and sha256 hex passwords set for a user.
+In the above example the `password_sha256_hex` value is the hexadecimal representation of the SHA256 hash of the password. This configuration for the user `default` has the attribute `replace=true` because the default configuration has a plain text `password` set, and it is not possible to have both plain text and sha256 hex passwords set for a user.
:::
## Storing named collections in configuration files
diff --git a/docs/en/operations/optimizing-performance/index.md b/docs/en/operations/optimizing-performance/index.md
deleted file mode 100644
index 83e9430ed27..00000000000
--- a/docs/en/operations/optimizing-performance/index.md
+++ /dev/null
@@ -1,9 +0,0 @@
----
-slug: /en/operations/optimizing-performance/
-sidebar_label: Optimizing Performance
-sidebar_position: 52
----
-
-# Optimizing Performance
-
-- [Sampling query profiler](../../operations/optimizing-performance/sampling-query-profiler.md)
diff --git a/docs/en/operations/server-configuration-parameters/index.md b/docs/en/operations/server-configuration-parameters/index.md
deleted file mode 100644
index d4b941c0819..00000000000
--- a/docs/en/operations/server-configuration-parameters/index.md
+++ /dev/null
@@ -1,16 +0,0 @@
----
-slug: /en/operations/server-configuration-parameters/
-sidebar_position: 54
-sidebar_label: Server Configuration Parameters
-pagination_next: en/operations/server-configuration-parameters/settings
----
-
-# Server Configuration Parameters
-
-This section contains descriptions of server settings that cannot be changed at the session or query level.
-
-These settings are stored in the `config.xml` file on the ClickHouse server.
-
-Other settings are described in the “[Settings](../../operations/settings/index.md#session-settings-intro)” section.
-
-Before studying the settings, read the [Configuration files](../../operations/configuration-files.md#configuration_files) section and note the use of substitutions (the `incl` and `optional` attributes).
diff --git a/docs/en/operations/server-configuration-parameters/settings.md b/docs/en/operations/server-configuration-parameters/settings.md
index f93ab264511..bad7e388377 100644
--- a/docs/en/operations/server-configuration-parameters/settings.md
+++ b/docs/en/operations/server-configuration-parameters/settings.md
@@ -7,6 +7,14 @@ description: This section contains descriptions of server settings that cannot b
# Server Settings
+This section contains descriptions of server settings that cannot be changed at the session or query level.
+
+These settings are stored in the `config.xml` file on the ClickHouse server.
+
+Other settings are described in the “[Settings](../../operations/settings/index.md#session-settings-intro)” section.
+
+Before studying the settings, read the [Configuration files](../../operations/configuration-files.md#configuration_files) section and note the use of substitutions (the `incl` and `optional` attributes).
+
## allow_use_jemalloc_memory
Allows to use jemalloc memory.
@@ -202,7 +210,7 @@ Default: 15
## dns_max_consecutive_failures
-Max connection failures before dropping host from ClickHouse DNS cache
+Max consecutive resolving failures before dropping a host from ClickHouse DNS cache
Type: UInt32
@@ -1594,7 +1602,7 @@ Keys for server/client settings:
- requireTLSv1_2 (default: false) – Require a TLSv1.2 connection. Acceptable values: `true`, `false`.
- fips (default: false) – Activates OpenSSL FIPS mode. Supported if the library’s OpenSSL version supports FIPS.
- privateKeyPassphraseHandler (default: `KeyConsoleHandler`)– Class (PrivateKeyPassphraseHandler subclass) that requests the passphrase for accessing the private key. For example: `<privateKeyPassphraseHandler>`, `<name>KeyFileHandler</name>`, `<options><password>test</password></options>`, `</privateKeyPassphraseHandler>`.
-- invalidCertificateHandler (default: `ConsoleCertificateHandler`) – Class (a subclass of CertificateHandler) for verifying invalid certificates. For example: `ConsoleCertificateHandler` .
+- invalidCertificateHandler (default: `RejectCertificateHandler`) – Class (a subclass of CertificateHandler) for verifying invalid certificates. For example: `RejectCertificateHandler`.
- disableProtocols (default: "") – Protocols that are not allowed to use.
- preferServerCiphers (default: false) – Preferred server ciphers on the client.
@@ -1881,6 +1889,32 @@ The default server configuration file `config.xml` contains the following settin
```
+## asynchronous_insert_log {#server_configuration_parameters-asynchronous_insert_log}
+
+Settings for the [asynchronous_insert_log](../../operations/system-tables/asynchronous_insert_log.md#system_tables-asynchronous_insert_log) system table for logging async inserts.
+
+Parameters:
+
+- `database` — Database name.
+- `table` — Table name.
+- `partition_by` — [Custom partitioning key](../../engines/table-engines/mergetree-family/custom-partitioning-key.md) for a system table. Can't be used if `engine` is defined.
+- `engine` - [MergeTree Engine Definition](../../engines/table-engines/mergetree-family/mergetree.md#table_engine-mergetree-creating-a-table) for a system table. Can't be used if `partition_by` is defined.
+- `flush_interval_milliseconds` — Interval for flushing data from the buffer in memory to the table.
+- `storage_policy` – Name of storage policy to use for the table (optional)
+
+**Example**
+```xml
+<clickhouse>
+    <asynchronous_insert_log>
+        <database>system</database>
+        <table>asynchronous_insert_log</table>
+        <flush_interval_milliseconds>7500</flush_interval_milliseconds>
+        <partition_by>toYYYYMM(event_date)</partition_by>
+    </asynchronous_insert_log>
+</clickhouse>
+```
+
## query_masking_rules {#query-masking-rules}
Regexp-based rules, which will be applied to queries as well as all log messages before storing them in server logs,
@@ -1941,6 +1975,10 @@ The time zone is necessary for conversions between String and DateTime formats w
Asia/Istanbul
```
+**See also**
+
+- [session_timezone](../settings/settings.md#session_timezone)
+
## tcp_port {#server_configuration_parameters-tcp_port}
Port for communicating with clients over the TCP protocol.
@@ -2082,7 +2120,13 @@ This section contains the following parameters:
- `operation_timeout_ms` — Maximum timeout for one operation in milliseconds.
- `root` — The [znode](http://zookeeper.apache.org/doc/r3.5.5/zookeeperOver.html#Nodes+and+ephemeral+nodes) that is used as the root for znodes used by the ClickHouse server. Optional.
- `identity` — User and password, that can be required by ZooKeeper to give access to requested znodes. Optional.
-
+- `zookeeper_load_balancing` - Specifies the algorithm of ZooKeeper node selection.
+  * `random` - randomly selects one of the ZooKeeper nodes.
+  * `in_order` - selects the first ZooKeeper node; if it's not available, the second, and so on.
+  * `nearest_hostname` - selects the ZooKeeper node with a hostname that is most similar to the server's hostname.
+  * `first_or_random` - selects the first ZooKeeper node; if it's not available, randomly selects one of the remaining ZooKeeper nodes.
+  * `round_robin` - selects the first ZooKeeper node; if reconnection happens, selects the next.
+
**Example configuration**
``` xml
@@ -2101,6 +2145,8 @@ This section contains the following parameters:
    <root>/path/to/zookeeper/node</root>
    <identity>user:password</identity>
+
+    <zookeeper_load_balancing>random</zookeeper_load_balancing>
</zookeeper>
```
diff --git a/docs/en/operations/settings/settings-formats.md b/docs/en/operations/settings/settings-formats.md
index 65038d3a256..1b22a6d1223 100644
--- a/docs/en/operations/settings/settings-formats.md
+++ b/docs/en/operations/settings/settings-formats.md
@@ -137,6 +137,12 @@ The maximum rows of data to read for automatic schema inference.
Default value: `25'000`.
+## input_format_max_bytes_to_read_for_schema_inference {#input_format_max_bytes_to_read_for_schema_inference}
+
+The maximum amount of data in bytes to read for automatic schema inference.
+
+Default value: `33554432` (32 Mb).
+
## column_names_for_schema_inference {#column_names_for_schema_inference}
The list of column names to use in schema inference for formats without column names. The format: 'column1,column2,column3,...'
@@ -728,6 +734,12 @@ My NULL
My NULL
```
+### input_format_tsv_skip_trailing_empty_lines {#input_format_tsv_skip_trailing_empty_lines}
+
+When enabled, trailing empty lines at the end of a TSV file will be skipped.
+
+Disabled by default.
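+
+An illustrative sketch (`clickhouse local` exposes piped data as the table `table`, as in the examples below):
+
+``` bash
+printf 'Acme\t25\n\n\n' | ./clickhouse local -q "select * from table" --input-format="TSV" --input_format_tsv_skip_trailing_empty_lines=1
+```
+
+With the setting enabled, the two trailing empty lines are skipped instead of being parsed as rows.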
+
## CSV format settings {#csv-format-settings}
### format_csv_delimiter {#format_csv_delimiter}
@@ -882,6 +894,76 @@ My NULL
My NULL
```
+### input_format_csv_skip_trailing_empty_lines {#input_format_csv_skip_trailing_empty_lines}
+
+When enabled, trailing empty lines at the end of a CSV file will be skipped.
+
+Disabled by default.
+
+### input_format_csv_trim_whitespaces {#input_format_csv_trim_whitespaces}
+
+Trims spaces and tabs in non-quoted CSV strings.
+
+Default value: `true`.
+
+**Examples**
+
+Query
+
+```bash
+echo ' string ' | ./clickhouse local -q "select * from table FORMAT CSV" --input-format="CSV" --input_format_csv_trim_whitespaces=true
+```
+
+Result
+
+```text
+"string"
+```
+
+Query
+
+```bash
+echo ' string ' | ./clickhouse local -q "select * from table FORMAT CSV" --input-format="CSV" --input_format_csv_trim_whitespaces=false
+```
+
+Result
+
+```text
+" string "
+```
+
+### input_format_csv_allow_whitespace_or_tab_as_delimiter {#input_format_csv_allow_whitespace_or_tab_as_delimiter}
+
+Allow to use whitespace or tab as field delimiter in CSV strings.
+
+Default value: `false`.
+
+**Examples**
+
+Query
+
+```bash
+echo 'a b' | ./clickhouse local -q "select * from table FORMAT CSV" --input-format="CSV" --input_format_csv_allow_whitespace_or_tab_as_delimiter=true --format_csv_delimiter=' '
+```
+
+Result
+
+```text
+a b
+```
+
+Query
+
+```bash
+echo 'a b' | ./clickhouse local -q "select * from table FORMAT CSV" --input-format="CSV" --input_format_csv_allow_whitespace_or_tab_as_delimiter=true --format_csv_delimiter='\t'
+```
+
+Result
+
+```text
+a b
+```
+
## Values format settings {#values-format-settings}
### input_format_values_interpret_expressions {#input_format_values_interpret_expressions}
@@ -1443,6 +1525,12 @@ Sets the character that is interpreted as a suffix after the result set for [Cus
Default value: `''`.
+### input_format_custom_skip_trailing_empty_lines {#input_format_custom_skip_trailing_empty_lines}
+
+When enabled, trailing empty lines at the end of a file in CustomSeparated format will be skipped.
+
+Disabled by default.
+
## Regexp format settings {#regexp-format-settings}
### format_regexp_escaping_rule {#format_regexp_escaping_rule}
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 6c951739d41..cff13302cdc 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -227,6 +227,89 @@ SELECT * FROM data_01515 WHERE d1 = 0 SETTINGS force_data_skipping_indices='`d1_
SELECT * FROM data_01515 WHERE d1 = 0 AND assumeNotNull(d1_null) = 0 SETTINGS force_data_skipping_indices='`d1_idx`, d1_null_idx'; -- Ok.
```
+## ignore_data_skipping_indices {#settings-ignore_data_skipping_indices}
+
+Makes the query ignore the specified data skipping indexes.
+
+Consider the following example:
+
+```sql
+CREATE TABLE data
+(
+ key Int,
+ x Int,
+ y Int,
+ INDEX x_idx x TYPE minmax GRANULARITY 1,
+ INDEX y_idx y TYPE minmax GRANULARITY 1,
+ INDEX xy_idx (x,y) TYPE minmax GRANULARITY 1
+)
+Engine=MergeTree()
+ORDER BY key;
+
+INSERT INTO data VALUES (1, 2, 3);
+
+SELECT * FROM data;
+SELECT * FROM data SETTINGS ignore_data_skipping_indices=''; -- query will produce CANNOT_PARSE_TEXT error.
+SELECT * FROM data SETTINGS ignore_data_skipping_indices='x_idx'; -- Ok.
+SELECT * FROM data SETTINGS ignore_data_skipping_indices='na_idx'; -- Ok.
+
+SELECT * FROM data WHERE x = 1 AND y = 1 SETTINGS ignore_data_skipping_indices='xy_idx',force_data_skipping_indices='xy_idx'; -- query will produce INDEX_NOT_USED error, since xy_idx is explicitly ignored.
+SELECT * FROM data WHERE x = 1 AND y = 2 SETTINGS ignore_data_skipping_indices='xy_idx';
+```
+
+The query without ignoring any indexes:
+```sql
+EXPLAIN indexes = 1 SELECT * FROM data WHERE x = 1 AND y = 2;
+
+Expression ((Projection + Before ORDER BY))
+ Filter (WHERE)
+ ReadFromMergeTree (default.data)
+ Indexes:
+ PrimaryKey
+ Condition: true
+ Parts: 1/1
+ Granules: 1/1
+ Skip
+ Name: x_idx
+ Description: minmax GRANULARITY 1
+ Parts: 0/1
+ Granules: 0/1
+ Skip
+ Name: y_idx
+ Description: minmax GRANULARITY 1
+ Parts: 0/0
+ Granules: 0/0
+ Skip
+ Name: xy_idx
+ Description: minmax GRANULARITY 1
+ Parts: 0/0
+ Granules: 0/0
+```
+
+Ignoring the `xy_idx` index:
+```sql
+EXPLAIN indexes = 1 SELECT * FROM data WHERE x = 1 AND y = 2 SETTINGS ignore_data_skipping_indices='xy_idx';
+
+Expression ((Projection + Before ORDER BY))
+ Filter (WHERE)
+ ReadFromMergeTree (default.data)
+ Indexes:
+ PrimaryKey
+ Condition: true
+ Parts: 1/1
+ Granules: 1/1
+ Skip
+ Name: x_idx
+ Description: minmax GRANULARITY 1
+ Parts: 0/1
+ Granules: 0/1
+ Skip
+ Name: y_idx
+ Description: minmax GRANULARITY 1
+ Parts: 0/0
+ Granules: 0/0
+```
+
Works with tables in the MergeTree family.
## convert_query_to_cnf {#convert_query_to_cnf}
@@ -452,8 +535,6 @@ Possible values:
The first phase of a grace join reads the right table and splits it into N buckets depending on the hash value of key columns (initially, N is `grace_hash_join_initial_buckets`). This is done in a way to ensure that each bucket can be processed independently. Rows from the first bucket are added to an in-memory hash table while the others are saved to disk. If the hash table grows beyond the memory limit (e.g., as set by [`max_bytes_in_join`](/docs/en/operations/settings/query-complexity.md/#settings-max_bytes_in_join)), the number of buckets is increased and the assigned bucket for each row. Any rows which don’t belong to the current bucket are flushed and reassigned.
- Supports `INNER/LEFT/RIGHT/FULL ALL/ANY JOIN`.
-
- hash
[Hash join algorithm](https://en.wikipedia.org/wiki/Hash_join) is used. The most generic implementation that supports all combinations of kind and strictness and multiple join keys that are combined with `OR` in the `JOIN ON` section.
@@ -1241,7 +1322,7 @@ Connection pool size for PostgreSQL table engine and database engine.
Default value: 16
-## postgresql_connection_pool_size {#postgresql-connection-pool-size}
+## postgresql_connection_pool_wait_timeout {#postgresql-connection-pool-wait-timeout}
Connection pool push/pop timeout on empty pool for PostgreSQL table engine and database engine. By default it will block on empty pool.
@@ -1876,6 +1957,10 @@ Default value: empty string (disabled)
For the replicated tables by default the only 100 of the most recent inserts for each partition are deduplicated (see [replicated_deduplication_window](merge-tree-settings.md/#replicated-deduplication-window), [replicated_deduplication_window_seconds](merge-tree-settings.md/#replicated-deduplication-window-seconds)).
For not replicated tables see [non_replicated_deduplication_window](merge-tree-settings.md/#non-replicated-deduplication-window).
+:::note
+`insert_deduplication_token` works on a partition level (the same as `insert_deduplication` checksum). Multiple partitions can have the same `insert_deduplication_token`.
+:::
+
Example:
```sql
@@ -2856,7 +2941,7 @@ Default value: `0`.
## mutations_sync {#mutations_sync}
-Allows to execute `ALTER TABLE ... UPDATE|DELETE` queries ([mutations](../../sql-reference/statements/alter/index.md#mutations)) synchronously.
+Allows to execute `ALTER TABLE ... UPDATE|DELETE|MATERIALIZE INDEX|MATERIALIZE PROJECTION|MATERIALIZE COLUMN` queries ([mutations](../../sql-reference/statements/alter/index.md#mutations)) synchronously.
Possible values:
@@ -3155,7 +3240,7 @@ Possible values:
- Positive integer.
- 0 or 1 — Disabled. `SELECT` queries are executed in a single thread.
-Default value: `16`.
+Default value: `max_threads`.
## opentelemetry_start_trace_probability {#opentelemetry-start-trace-probability}
@@ -3243,7 +3328,35 @@ Possible values:
Default value: `0`.
-## s3_truncate_on_insert
+## engine_file_allow_create_multiple_files {#engine_file_allow_create_multiple_files}
+
+Enables or disables creating a new file on each insert in file engine tables if the format has the suffix (`JSON`, `ORC`, `Parquet`, etc.). If enabled, on each insert a new file will be created with a name following this pattern:
+
+`data.Parquet` -> `data.1.Parquet` -> `data.2.Parquet`, etc.
+
+Possible values:
+- 0 — `INSERT` query appends new data to the end of the file.
+- 1 — `INSERT` query creates a new file.
+
+Default value: `0`.
+
+## engine_file_skip_empty_files {#engine_file_skip_empty_files}
+
+Enables or disables skipping empty files in [File](../../engines/table-engines/special/file.md) engine tables.
+
+Possible values:
+- 0 — `SELECT` throws an exception if empty file is not compatible with requested format.
+- 1 — `SELECT` returns empty result for empty file.
+
+Default value: `0`.
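+
+An illustrative sketch (assuming the setting also applies to the `file` table function, which is backed by the same storage):
+
+``` bash
+touch empty.parquet
+./clickhouse local -q "SELECT count() FROM file('empty.parquet', 'Parquet') SETTINGS engine_file_skip_empty_files = 1"
+```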
+
+## storage_file_read_method {#storage_file_read_method}
+
+Method of reading data from storage file, one of: `read`, `pread`, `mmap`. The mmap method does not apply to clickhouse-server (it's intended for clickhouse-local).
+
+Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local.
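+
+A usage sketch (hypothetical file; `mmap` is only honored by clickhouse-local):
+
+``` bash
+./clickhouse local -q "SELECT count() FROM file('data.csv', 'CSV')" --storage_file_read_method=mmap
+```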
+
+## s3_truncate_on_insert {#s3_truncate_on_insert}
Enables or disables truncate before inserts in s3 engine tables. If disabled, an exception will be thrown on insert attempts if an S3 object already exists.
@@ -3253,7 +3366,29 @@ Possible values:
Default value: `0`.
-## hdfs_truncate_on_insert
+## s3_create_new_file_on_insert {#s3_create_new_file_on_insert}
+
+Enables or disables creating a new file on each insert in s3 engine tables. If enabled, on each insert a new S3 object will be created with the key, similar to this pattern:
+
+initial: `data.Parquet.gz` -> `data.1.Parquet.gz` -> `data.2.Parquet.gz`, etc.
+
+Possible values:
+- 0 — `INSERT` query appends new data to the end of the file.
+- 1 — `INSERT` query creates a new file.
+
+Default value: `0`.
+
+## s3_skip_empty_files {#s3_skip_empty_files}
+
+Enables or disables skipping empty files in [S3](../../engines/table-engines/integrations/s3.md) engine tables.
+
+Possible values:
+- 0 — `SELECT` throws an exception if empty file is not compatible with requested format.
+- 1 — `SELECT` returns empty result for empty file.
+
+Default value: `0`.
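+
+A hedged sketch (hypothetical public bucket and path):
+
+``` bash
+clickhouse-client --query "SELECT count() FROM s3('https://mybucket.s3.amazonaws.com/data/*.parquet', 'Parquet') SETTINGS s3_skip_empty_files = 1"
+```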
+
+## hdfs_truncate_on_insert {#hdfs_truncate_on_insert}
Enables or disables truncation before an insert in hdfs engine tables. If disabled, an exception will be thrown on an attempt to insert if a file in HDFS already exists.
@@ -3263,31 +3398,7 @@ Possible values:
Default value: `0`.
-## engine_file_allow_create_multiple_files
-
-Enables or disables creating a new file on each insert in file engine tables if the format has the suffix (`JSON`, `ORC`, `Parquet`, etc.). If enabled, on each insert a new file will be created with a name following this pattern:
-
-`data.Parquet` -> `data.1.Parquet` -> `data.2.Parquet`, etc.
-
-Possible values:
-- 0 — `INSERT` query appends new data to the end of the file.
-- 1 — `INSERT` query replaces existing content of the file with the new data.
-
-Default value: `0`.
-
-## s3_create_new_file_on_insert
-
-Enables or disables creating a new file on each insert in s3 engine tables. If enabled, on each insert a new S3 object will be created with the key, similar to this pattern:
-
-initial: `data.Parquet.gz` -> `data.1.Parquet.gz` -> `data.2.Parquet.gz`, etc.
-
-Possible values:
-- 0 — `INSERT` query appends new data to the end of the file.
-- 1 — `INSERT` query replaces existing content of the file with the new data.
-
-Default value: `0`.
-
-## hdfs_create_new_file_on_insert
+## hdfs_create_new_file_on_insert {#hdfs_create_new_file_on_insert}
Enables or disables creating a new file on each insert in HDFS engine tables. If enabled, on each insert a new HDFS file will be created with the name, similar to this pattern:
@@ -3295,7 +3406,27 @@ initial: `data.Parquet.gz` -> `data.1.Parquet.gz` -> `data.2.Parquet.gz`, etc.
Possible values:
- 0 — `INSERT` query appends new data to the end of the file.
-- 1 — `INSERT` query replaces existing content of the file with the new data.
+- 1 — `INSERT` query creates a new file.
+
+Default value: `0`.
+
+## hdfs_skip_empty_files {#hdfs_skip_empty_files}
+
+Enables or disables skipping empty files in [HDFS](../../engines/table-engines/integrations/hdfs.md) engine tables.
+
+Possible values:
+- 0 — `SELECT` throws an exception if empty file is not compatible with requested format.
+- 1 — `SELECT` returns empty result for empty file.
+
+Default value: `0`.
+
+## engine_url_skip_empty_files {#engine_url_skip_empty_files}
+
+Enables or disables skipping empty files in [URL](../../engines/table-engines/special/url.md) engine tables.
+
+Possible values:
+- 0 — `SELECT` throws an exception if empty file is not compatible with requested format.
+- 1 — `SELECT` returns empty result for empty file.
Default value: `0`.
@@ -4120,6 +4251,69 @@ Default value: `0`.
Use this setting only for backward compatibility if your use cases depend on old syntax.
:::
+## session_timezone {#session_timezone}
+
+Sets the implicit time zone of the current session or query.
+The implicit time zone is the time zone applied to values of type DateTime/DateTime64 which have no explicitly specified time zone.
+The setting takes precedence over the globally configured (server-level) implicit time zone.
+A value of '' (empty string) means that the implicit time zone of the current session or query is equal to the [server time zone](../server-configuration-parameters/settings.md#server_configuration_parameters-timezone).
+
+You can use functions `timeZone()` and `serverTimeZone()` to get the session time zone and server time zone.
+
+Possible values:
+
+- Any time zone name from `system.time_zones`, e.g. `Europe/Berlin`, `UTC` or `Zulu`
+
+Default value: `''`.
+
+Examples:
+
+```sql
+SELECT timeZone(), serverTimeZone() FORMAT TSV
+
+Europe/Berlin Europe/Berlin
+```
+
+```sql
+SELECT timeZone(), serverTimeZone() SETTINGS session_timezone = 'Asia/Novosibirsk' FORMAT TSV
+
+Asia/Novosibirsk Europe/Berlin
+```
+
+Assign session time zone 'America/Denver' to the inner DateTime without explicitly specified time zone:
+
+```sql
+SELECT toDateTime64(toDateTime64('1999-12-12 23:23:23.123', 3), 3, 'Europe/Zurich') SETTINGS session_timezone = 'America/Denver' FORMAT TSV
+
+1999-12-13 07:23:23.123
+```
+
+:::warning
+Not all functions that parse DateTime/DateTime64 respect `session_timezone`. This can lead to subtle errors.
+See the following example and explanation.
+:::
+
+```sql
+CREATE TABLE test_tz (`d` DateTime('UTC')) ENGINE = Memory AS SELECT toDateTime('2000-01-01 00:00:00', 'UTC');
+
+SELECT *, timeZone() FROM test_tz WHERE d = toDateTime('2000-01-01 00:00:00') SETTINGS session_timezone = 'Asia/Novosibirsk'
+0 rows in set.
+
+SELECT *, timeZone() FROM test_tz WHERE d = '2000-01-01 00:00:00' SETTINGS session_timezone = 'Asia/Novosibirsk'
+┌───────────────────d─┬─timeZone()───────┐
+│ 2000-01-01 00:00:00 │ Asia/Novosibirsk │
+└─────────────────────┴──────────────────┘
+```
+
+This happens due to different parsing pipelines:
+
+- `toDateTime()` without an explicitly given time zone, as used in the first `SELECT` query, honors the setting `session_timezone` and the global time zone.
+- In the second query, a DateTime is parsed from a String and inherits the type and time zone of the existing column `d`. Thus, the setting `session_timezone` and the global time zone are not honored.
+
+**See also**
+
+- [timezone](../server-configuration-parameters/settings.md#server_configuration_parameters-timezone)
+
## final {#final}
Automatically applies [FINAL](../../sql-reference/statements/select/from.md#final-modifier) modifier to all tables in a query, to tables where [FINAL](../../sql-reference/statements/select/from.md#final-modifier) is applicable, including joined tables and tables in sub-queries, and
@@ -4229,6 +4423,12 @@ Default value: `2000`
If it's enabled, in hedged requests we can start new connection until receiving first data packet even if we have already made some progress
(but progress haven't updated for `receive_data_timeout` timeout), otherwise we disable changing replica after the first time we made progress.
+## parallel_view_processing
+
+Enables pushing to attached views concurrently instead of sequentially.
+
+Default value: `false`.
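+
+A hedged sketch of the effect (the table and view names are illustrative, not from this document):
+
+```sql
+-- Assume `source` has several materialized views attached to it.
+-- With the setting enabled, the views are pushed to concurrently:
+INSERT INTO source SELECT number FROM numbers(1000000)
+SETTINGS parallel_view_processing = 1;
+```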
+
## partial_result_on_first_cancel {#partial_result_on_first_cancel}
When set to `true` and the user wants to interrupt a query (for example using `Ctrl+C` on the client), then the query continues execution only on data that was already read from the table. Afterwards, it will return a partial result of the query for the part of the table that was read. To fully stop the execution of a query without a partial result, the user should send 2 cancel requests.
@@ -4278,6 +4478,32 @@ Possible values:
Default value: `false`.
+## rename_files_after_processing
+
+- **Type:** String
+
+- **Default value:** Empty string
+
+This setting allows you to specify a renaming pattern for files processed by the `file` table function. When the option is set, all files read by the `file` table function will be renamed according to the specified pattern with placeholders, but only if the files were processed successfully.
+
+### Placeholders
+
+- `%f` — Original filename without extension (e.g., "sample").
+- `%e` — Original file extension with dot (e.g., ".csv").
+- `%t` — Timestamp (in microseconds).
+- `%%` — Percentage sign ("%").
+
+### Example
+- Option: `--rename_files_after_processing="processed_%f_%t%e"`
+
+- Query: `SELECT * FROM file('sample.csv')`
+
+If reading `sample.csv` is successful, the file will be renamed to `processed_sample_1683473210851438.csv`.
+
## function_json_value_return_type_allow_complex
Controls whether the `json_value` function is allowed to return complex types (such as struct, array, map).
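+
+A hedged example of what this enables (the exact output is an assumption based on the description above):
+
+```sql
+-- With the setting enabled, JSON_VALUE may return a complex value such as an array:
+SELECT JSON_VALUE('{"a": [1, 2, 3]}', '$.a')
+SETTINGS function_json_value_return_type_allow_complex = true;
+```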
diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md
index 5804ad8545b..fe6e8e15b0c 100644
--- a/docs/en/operations/storing-data.md
+++ b/docs/en/operations/storing-data.md
@@ -184,13 +184,15 @@ These settings should be defined in the disk configuration section.
- `enable_filesystem_query_cache_limit` - allows limiting the size of the cache which is downloaded within each query (depends on the user setting `max_query_cache_size`). Default: `false`.
-- `enable_cache_hits_threshold` - number which defines how many times some data needs to be read before it will be cached. Default: `0`, e.g. the data is cached at the first attempt to read it.
+- `enable_cache_hits_threshold` - enables a threshold for the number of times some data needs to be read before it will be cached. Default: `false`. The threshold itself can be defined by `cache_hits_threshold`. Default: `0`, i.e. the data is cached at the first attempt to read it.
+
+- `enable_bypass_cache_with_threshold` - allows skipping the cache completely if the requested read range exceeds the threshold. Default: `false`. The threshold can be defined by `bypass_cache_threashold`. Default: `268435456` (`256Mi`).
- `do_not_evict_index_and_mark_files` - do not evict small frequently used files according to cache policy. Default: `false`. This setting was added in version 22.8. If you used filesystem cache before this version, then it will not work on versions starting from 22.8 if this setting is set to `true`. If you want to use this setting, clear old cache created before version 22.8 before upgrading.
-- `max_file_segment_size` - a maximum size of a single cache file in bytes or in readable format (`ki, Mi, Gi, etc`, example `10Gi`). Default: `104857600` (`100Mi`).
+- `max_file_segment_size` - a maximum size of a single cache file in bytes or in readable format (`ki, Mi, Gi, etc`, example `10Gi`). Default: `8388608` (`8Mi`).
-- `max_elements` - a limit for a number of cache files. Default: `1048576`.
+- `max_elements` - a limit for a number of cache files. Default: `10000000`.
File Cache **query/profile settings**:
diff --git a/docs/en/operations/system-tables/asynchronous_insert_log.md b/docs/en/operations/system-tables/asynchronous_insert_log.md
new file mode 100644
index 00000000000..c3aaa8e6c41
--- /dev/null
+++ b/docs/en/operations/system-tables/asynchronous_insert_log.md
@@ -0,0 +1,64 @@
+---
+slug: /en/operations/system-tables/asynchronous_insert_log
+---
+# asynchronous_insert_log
+
+Contains information about async inserts. Each entry represents an insert query buffered into an async insert query.
+
+To start logging, configure parameters in the [asynchronous_insert_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-asynchronous_insert_log) section.
+
+The flushing period of data is set in the `flush_interval_milliseconds` parameter of the [asynchronous_insert_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-asynchronous_insert_log) server settings section. To force flushing, use the [SYSTEM FLUSH LOGS](../../sql-reference/statements/system.md#query_language-system-flush_logs) query.
+
+ClickHouse does not delete data from the table automatically. See [Introduction](../../operations/system-tables/index.md#system-tables-introduction) for more details.
+
+Columns:
+
+- `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the async insert happened.
+- `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the async insert finished execution.
+- `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — The date and time when the async insert finished execution with microseconds precision.
+- `query` ([String](../../sql-reference/data-types/string.md)) — Query string.
+- `database` ([String](../../sql-reference/data-types/string.md)) — The name of the database the table is in.
+- `table` ([String](../../sql-reference/data-types/string.md)) — Table name.
+- `format` ([String](/docs/en/sql-reference/data-types/string.md)) — Format name.
+- `query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the initial query.
+- `bytes` ([UInt64](../../sql-reference/data-types/int-uint.md#uint-ranges)) — Number of inserted bytes.
+- `exception` ([String](../../sql-reference/data-types/string.md)) — Exception message.
+- `status` ([Enum8](../../sql-reference/data-types/enum.md)) — Status of the insert. Values:
+ - `'Ok' = 1` — Successful insert.
+ - `'ParsingError' = 2` — Exception when parsing the data.
+ - `'FlushError' = 3` — Exception when flushing the data.
+- `flush_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the flush happened.
+- `flush_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — The date and time when the flush happened with microseconds precision.
+- `flush_query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the flush query.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT * FROM system.asynchronous_insert_log LIMIT 1 \G;
+```
+
+Result:
+
+``` text
+event_date: 2023-06-08
+event_time: 2023-06-08 10:08:53
+event_time_microseconds: 2023-06-08 10:08:53.199516
+query: INSERT INTO public.data_guess (user_id, datasource_id, timestamp, path, type, num, str) FORMAT CSV
+database: public
+table: data_guess
+format: CSV
+query_id: b46cd4c4-0269-4d0b-99f5-d27668c6102e
+bytes: 133223
+exception:
+status: Ok
+flush_time: 2023-06-08 10:08:55
+flush_time_microseconds: 2023-06-08 10:08:55.139676
+flush_query_id: cd2c1e43-83f5-49dc-92e4-2fbc7f8d3716
+```
+
+**See Also**
+
+- [system.query_log](../../operations/system-tables/query_log.md#system_tables-query_log) — Description of the `query_log` system table which contains common information about query execution.
+- [system.asynchronous_inserts](../../operations/system-tables/asynchronous_inserts.md#system_tables-asynchronous_inserts) — This table contains information about pending asynchronous inserts in queue.
diff --git a/docs/en/operations/system-tables/asynchronous_inserts.md b/docs/en/operations/system-tables/asynchronous_inserts.md
new file mode 100644
index 00000000000..8fd5f2bb520
--- /dev/null
+++ b/docs/en/operations/system-tables/asynchronous_inserts.md
@@ -0,0 +1,45 @@
+---
+slug: /en/operations/system-tables/asynchronous_inserts
+---
+# asynchronous_inserts
+
+Contains information about pending asynchronous inserts in queue.
+
+Columns:
+
+- `query` ([String](../../sql-reference/data-types/string.md)) — Query string.
+- `database` ([String](../../sql-reference/data-types/string.md)) — The name of the database the table is in.
+- `table` ([String](../../sql-reference/data-types/string.md)) — Table name.
+- `format` ([String](/docs/en/sql-reference/data-types/string.md)) — Format name.
+- `first_update` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — First insert time with microseconds resolution.
+- `total_bytes` ([UInt64](../../sql-reference/data-types/int-uint.md#uint-ranges)) — Total number of bytes waiting in the queue.
+- `entries.query_id` ([Array(String)](../../sql-reference/data-types/array.md)) — Array of query IDs of the inserts waiting in the queue.
+- `entries.bytes` ([Array(UInt64)](../../sql-reference/data-types/array.md)) — Array of byte counts of each insert query waiting in the queue.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT * FROM system.asynchronous_inserts LIMIT 1 \G;
+```
+
+Result:
+
+``` text
+Row 1:
+──────
+query: INSERT INTO public.data_guess (user_id, datasource_id, timestamp, path, type, num, str) FORMAT CSV
+database: public
+table: data_guess
+format: CSV
+first_update: 2023-06-08 10:08:54.199606
+total_bytes: 133223
+entries.query_id: ['b46cd4c4-0269-4d0b-99f5-d27668c6102e']
+entries.bytes: [133223]
+```
+
+**See Also**
+
+- [system.query_log](../../operations/system-tables/query_log.md#system_tables-query_log) — Description of the `query_log` system table which contains common information about query execution.
+- [system.asynchronous_insert_log](../../operations/system-tables/asynchronous_insert_log.md#system_tables-asynchronous_insert_log) — This table contains information about async inserts performed.
diff --git a/docs/en/operations/system-tables/parts.md b/docs/en/operations/system-tables/parts.md
index 9159d1e9284..5829e5ad313 100644
--- a/docs/en/operations/system-tables/parts.md
+++ b/docs/en/operations/system-tables/parts.md
@@ -27,7 +27,7 @@ Columns:
Data storing format is controlled by the `min_bytes_for_wide_part` and `min_rows_for_wide_part` settings of the [MergeTree](../../engines/table-engines/mergetree-family/mergetree.md) table.
- - `active` ([UInt8](../../sql-reference/data-types/int-uint.md)) – Flag that indicates whether the data part is active. If a data part is active, it’s used in a table. Otherwise, it’s deleted. Inactive data parts remain after merging.
+- `active` ([UInt8](../../sql-reference/data-types/int-uint.md)) – Flag that indicates whether the data part is active. If a data part is active, it’s used in a table. Otherwise, it’s deleted. Inactive data parts remain after merging.
- `marks` ([UInt64](../../sql-reference/data-types/int-uint.md)) – The number of marks. To get the approximate number of rows in a data part, multiply `marks` by the index granularity (usually 8192) (this hint does not work for adaptive granularity).
diff --git a/docs/en/operations/system-tables/processes.md b/docs/en/operations/system-tables/processes.md
index 2e729920ed0..ffa37357053 100644
--- a/docs/en/operations/system-tables/processes.md
+++ b/docs/en/operations/system-tables/processes.md
@@ -10,14 +10,14 @@ Columns:
- `user` (String) – The user who made the query. Keep in mind that for distributed processing, queries are sent to remote servers under the `default` user. The field contains the username for a specific query, not for a query that this query initiated.
- `address` (String) – The IP address the request was made from. The same for distributed processing. To track where a distributed query was originally made from, look at `system.processes` on the query requestor server.
- `elapsed` (Float64) – The time in seconds since request execution started.
-- `rows_read` (UInt64) – The number of rows read from the table. For distributed processing, on the requestor server, this is the total for all remote servers.
-- `bytes_read` (UInt64) – The number of uncompressed bytes read from the table. For distributed processing, on the requestor server, this is the total for all remote servers.
+- `read_rows` (UInt64) – The number of rows read from the table. For distributed processing, on the requestor server, this is the total for all remote servers.
+- `read_bytes` (UInt64) – The number of uncompressed bytes read from the table. For distributed processing, on the requestor server, this is the total for all remote servers.
- `total_rows_approx` (UInt64) – The approximation of the total number of rows that should be read. For distributed processing, on the requestor server, this is the total for all remote servers. It can be updated during request processing, when new sources to process become known.
-- `memory_usage` (UInt64) – Amount of RAM the request uses. It might not include some types of dedicated memory. See the [max_memory_usage](../../operations/settings/query-complexity.md#settings_max_memory_usage) setting.
+- `memory_usage` (Int64) – Amount of RAM the request uses. It might not include some types of dedicated memory. See the [max_memory_usage](../../operations/settings/query-complexity.md#settings_max_memory_usage) setting.
- `query` (String) – The query text. For `INSERT`, it does not include the data to insert.
- `query_id` (String) – Query ID, if defined.
-- `is_cancelled` (Int8) – Was query cancelled.
-- `is_all_data_sent` (Int8) – Was all data sent to the client (in other words query had been finished on the server).
+- `is_cancelled` (UInt8) – Was the query cancelled.
+- `is_all_data_sent` (UInt8) – Was all data sent to the client (in other words, the query has finished on the server).
```sql
SELECT * FROM system.processes LIMIT 10 FORMAT Vertical;
diff --git a/docs/en/operations/system-tables/query_log.md b/docs/en/operations/system-tables/query_log.md
index 71e1452cef1..b9fdd19c643 100644
--- a/docs/en/operations/system-tables/query_log.md
+++ b/docs/en/operations/system-tables/query_log.md
@@ -71,11 +71,11 @@ Columns:
- 0 — Query was initiated by another query as part of distributed query execution.
- `user` ([String](../../sql-reference/data-types/string.md)) — Name of the user who initiated the current query.
- `query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the query.
-- `address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — IP address that was used to make the query.
+- `address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — IP address that was used to make the query.
- `port` ([UInt16](../../sql-reference/data-types/int-uint.md)) — The client port that was used to make the query.
- `initial_user` ([String](../../sql-reference/data-types/string.md)) — Name of the user who ran the initial query (for distributed query execution).
- `initial_query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the initial query (for distributed query execution).
-- `initial_address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — IP address that the parent query was launched from.
+- `initial_address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — IP address that the parent query was launched from.
- `initial_port` ([UInt16](../../sql-reference/data-types/int-uint.md)) — The client port that was used to make the parent query.
- `initial_query_start_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Initial query starting time (for distributed query execution).
- `initial_query_start_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — Initial query starting time with microseconds precision (for distributed query execution).
diff --git a/docs/en/operations/system-tables/query_thread_log.md b/docs/en/operations/system-tables/query_thread_log.md
index cdd23bb15db..a6d5632ade9 100644
--- a/docs/en/operations/system-tables/query_thread_log.md
+++ b/docs/en/operations/system-tables/query_thread_log.md
@@ -40,11 +40,11 @@ Columns:
- 0 — Query was initiated by another query for distributed query execution.
- `user` ([String](../../sql-reference/data-types/string.md)) — Name of the user who initiated the current query.
- `query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the query.
-- `address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — IP address that was used to make the query.
+- `address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — IP address that was used to make the query.
- `port` ([UInt16](../../sql-reference/data-types/int-uint.md#uint-ranges)) — The client port that was used to make the query.
- `initial_user` ([String](../../sql-reference/data-types/string.md)) — Name of the user who ran the initial query (for distributed query execution).
- `initial_query_id` ([String](../../sql-reference/data-types/string.md)) — ID of the initial query (for distributed query execution).
-- `initial_address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — IP address that the parent query was launched from.
+- `initial_address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — IP address that the parent query was launched from.
- `initial_port` ([UInt16](../../sql-reference/data-types/int-uint.md#uint-ranges)) — The client port that was used to make the parent query.
- `interface` ([UInt8](../../sql-reference/data-types/int-uint.md#uint-ranges)) — Interface that the query was initiated from. Possible values:
- 1 — TCP.
diff --git a/docs/en/operations/system-tables/session_log.md b/docs/en/operations/system-tables/session_log.md
index 661d34677e4..5b1a2b2a489 100644
--- a/docs/en/operations/system-tables/session_log.md
+++ b/docs/en/operations/system-tables/session_log.md
@@ -28,7 +28,7 @@ Columns:
- `profiles` ([Array](../../sql-reference/data-types/array.md)([LowCardinality(String)](../../sql-reference/data-types/lowcardinality.md))) — The list of profiles set for all roles and/or users.
- `roles` ([Array](../../sql-reference/data-types/array.md)([LowCardinality(String)](../../sql-reference/data-types/lowcardinality.md))) — The list of roles to which the profile is applied.
- `settings` ([Array](../../sql-reference/data-types/array.md)([Tuple](../../sql-reference/data-types/tuple.md)([LowCardinality(String)](../../sql-reference/data-types/lowcardinality.md), [String](../../sql-reference/data-types/string.md)))) — Settings that were changed when the client logged in/out.
-- `client_address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — The IP address that was used to log in/out.
+- `client_address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — The IP address that was used to log in/out.
- `client_port` ([UInt16](../../sql-reference/data-types/int-uint.md)) — The client port that was used to log in/out.
- `interface` ([Enum8](../../sql-reference/data-types/enum.md)) — The interface from which the login was initiated. Possible values:
- `TCP`
diff --git a/docs/en/operations/system-tables/user_processes.md b/docs/en/operations/system-tables/user_processes.md
new file mode 100644
index 00000000000..94c153fb683
--- /dev/null
+++ b/docs/en/operations/system-tables/user_processes.md
@@ -0,0 +1,28 @@
+---
+slug: /en/operations/system-tables/user_processes
+---
+# user_processes
+
+This system table can be used to get an overview of the memory usage and ProfileEvents of users.
+
+Columns:
+
+- `user` ([String](../../sql-reference/data-types/string.md)) — User name.
+- `memory_usage` ([Int64](../../sql-reference/data-types/int-uint.md#int-ranges)) – Sum of RAM used by all processes of the user. It might not include some types of dedicated memory. See the [max_memory_usage](../../operations/settings/query-complexity.md#settings_max_memory_usage) setting.
+- `peak_memory_usage` ([Int64](../../sql-reference/data-types/int-uint.md#int-ranges)) — The peak of memory usage of the user. It can be reset when no queries are run for the user.
+- `ProfileEvents` ([Map(String, UInt64)](../../sql-reference/data-types/map.md)) – Summary of ProfileEvents that measure different metrics for the user. Their descriptions can be found in the table [system.events](../../operations/system-tables/events.md#system_tables-events).
+
+```sql
+SELECT * FROM system.user_processes LIMIT 10 FORMAT Vertical;
+```
+
+```response
+Row 1:
+──────
+user: default
+memory_usage: 9832
+peak_memory_usage: 9832
+ProfileEvents: {'Query':5,'SelectQuery':5,'QueriesWithSubqueries':38,'SelectQueriesWithSubqueries':38,'QueryTimeMicroseconds':842048,'SelectQueryTimeMicroseconds':842048,'ReadBufferFromFileDescriptorRead':6,'ReadBufferFromFileDescriptorReadBytes':234,'IOBufferAllocs':3,'IOBufferAllocBytes':98493,'ArenaAllocChunks':283,'ArenaAllocBytes':1482752,'FunctionExecute':670,'TableFunctionExecute':16,'DiskReadElapsedMicroseconds':19,'NetworkSendElapsedMicroseconds':684,'NetworkSendBytes':139498,'SelectedRows':6076,'SelectedBytes':685802,'ContextLock':1140,'RWLockAcquiredReadLocks':193,'RWLockReadersWaitMilliseconds':4,'RealTimeMicroseconds':1585163,'UserTimeMicroseconds':889767,'SystemTimeMicroseconds':13630,'SoftPageFaults':1947,'OSCPUWaitMicroseconds':6,'OSCPUVirtualTimeMicroseconds':903251,'OSReadChars':28631,'OSWriteChars':28888,'QueryProfilerRuns':3,'LogTrace':79,'LogDebug':24}
+
+1 row in set. Elapsed: 0.010 sec.
+```
diff --git a/docs/en/operations/system-tables/zookeeper_connection.md b/docs/en/operations/system-tables/zookeeper_connection.md
index 9438cda1808..2f0ed303ce3 100644
--- a/docs/en/operations/system-tables/zookeeper_connection.md
+++ b/docs/en/operations/system-tables/zookeeper_connection.md
@@ -11,7 +11,8 @@ Columns:
- `host` ([String](../../sql-reference/data-types/string.md)) — The hostname/IP of the ZooKeeper node that ClickHouse connected to.
- `port` ([String](../../sql-reference/data-types/string.md)) — The port of the ZooKeeper node that ClickHouse connected to.
- `index` ([UInt8](../../sql-reference/data-types/int-uint.md)) — The index of the ZooKeeper node that ClickHouse connected to. The index is from ZooKeeper config.
-- `connected_time` ([String](../../sql-reference/data-types/string.md)) — When the connection was established
+- `connected_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — When the connection was established.
+- `session_uptime_elapsed_seconds` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Seconds elapsed since the connection was established.
- `is_expired` ([UInt8](../../sql-reference/data-types/int-uint.md)) — Is the current connection expired.
- `keeper_api_version` ([String](../../sql-reference/data-types/string.md)) — Keeper API version.
- `client_id` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Session id of the connection.
@@ -23,7 +24,7 @@ SELECT * FROM system.zookeeper_connection;
```
``` text
-┌─name──────────────┬─host─────────┬─port─┬─index─┬──────connected_time─┬─is_expired─┬─keeper_api_version─┬──────────client_id─┐
-│ default_zookeeper │ 127.0.0.1 │ 2181 │ 0 │ 2023-05-19 14:30:16 │ 0 │ 0 │ 216349144108826660 │
-└───────────────────┴──────────────┴──────┴───────┴─────────────────────┴────────────┴────────────────────┴────────────────────┘
+┌─name────┬─host──────┬─port─┬─index─┬──────connected_time─┬─session_uptime_elapsed_seconds─┬─is_expired─┬─keeper_api_version─┬─client_id─┐
+│ default │ 127.0.0.1 │ 9181 │ 0 │ 2023-06-15 14:36:01 │ 3058 │ 0 │ 3 │ 5 │
+└─────────┴───────────┴──────┴───────┴─────────────────────┴────────────────────────────────┴────────────┴────────────────────┴───────────┘
```
diff --git a/docs/en/operations/system-tables/zookeeper_log.md b/docs/en/operations/system-tables/zookeeper_log.md
index b7cc4e22cd6..dce5be29f62 100644
--- a/docs/en/operations/system-tables/zookeeper_log.md
+++ b/docs/en/operations/system-tables/zookeeper_log.md
@@ -15,7 +15,7 @@ Columns with request parameters:
- `Finalize` — The connection is lost, no response was received.
- `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the event happened.
- `event_time` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — The date and time when the event happened.
-- `address` ([IPv6](../../sql-reference/data-types/domains/ipv6.md)) — IP address of ZooKeeper server that was used to make the request.
+- `address` ([IPv6](../../sql-reference/data-types/ipv6.md)) — IP address of ZooKeeper server that was used to make the request.
- `port` ([UInt16](../../sql-reference/data-types/int-uint.md)) — The port of ZooKeeper server that was used to make the request.
- `session_id` ([Int64](../../sql-reference/data-types/int-uint.md)) — The session ID that the ZooKeeper server sets for each connection.
- `xid` ([Int32](../../sql-reference/data-types/int-uint.md)) — The ID of the request within the session. This is usually a sequential request number. It is the same for the request row and the paired `response`/`finalize` row.
diff --git a/docs/en/sql-reference/aggregate-functions/combinators.md b/docs/en/sql-reference/aggregate-functions/combinators.md
index e1db5d8d23e..a395b350a55 100644
--- a/docs/en/sql-reference/aggregate-functions/combinators.md
+++ b/docs/en/sql-reference/aggregate-functions/combinators.md
@@ -30,7 +30,34 @@ Example 2: `uniqArray(arr)` – Counts the number of unique elements in all ‘a
The -Map suffix can be appended to any aggregate function. This will create an aggregate function which gets Map type as an argument, and aggregates values of each key of the map separately using the specified aggregate function. The result is also of a Map type.
-Examples: `sumMap(map(1,1))`, `avgMap(map('a', 1))`.
+**Example**
+
+```sql
+CREATE TABLE map_map(
+ date Date,
+ timeslot DateTime,
+ status Map(String, UInt64)
+) ENGINE = Log;
+
+INSERT INTO map_map VALUES
+ ('2000-01-01', '2000-01-01 00:00:00', (['a', 'b', 'c'], [10, 10, 10])),
+ ('2000-01-01', '2000-01-01 00:00:00', (['c', 'd', 'e'], [10, 10, 10])),
+ ('2000-01-01', '2000-01-01 00:01:00', (['d', 'e', 'f'], [10, 10, 10])),
+ ('2000-01-01', '2000-01-01 00:01:00', (['f', 'g', 'g'], [10, 10, 10]));
+
+SELECT
+ timeslot,
+ sumMap(status),
+ avgMap(status),
+ minMap(status)
+FROM map_map
+GROUP BY timeslot;
+
+┌────────────timeslot─┬─sumMap(status)───────────────────────┬─avgMap(status)───────────────────────┬─minMap(status)───────────────────────┐
+│ 2000-01-01 00:00:00 │ {'a':10,'b':10,'c':20,'d':10,'e':10} │ {'a':10,'b':10,'c':10,'d':10,'e':10} │ {'a':10,'b':10,'c':10,'d':10,'e':10} │
+│ 2000-01-01 00:01:00 │ {'d':10,'e':10,'f':20,'g':20} │ {'d':10,'e':10,'f':10,'g':10} │ {'d':10,'e':10,'f':10,'g':10} │
+└─────────────────────┴──────────────────────────────────────┴──────────────────────────────────────┴──────────────────────────────────────┘
+```
## -SimpleState
@@ -70,6 +97,10 @@ Result:
If you apply this combinator, the aggregate function does not return the resulting value (such as the number of unique values for the [uniq](../../sql-reference/aggregate-functions/reference/uniq.md#agg_function-uniq) function), but an intermediate state of the aggregation (for `uniq`, this is the hash table for calculating the number of unique values). This is an `AggregateFunction(...)` that can be used for further processing or stored in a table to finish aggregating later.
+:::note
+Please note that -MapState is not invariant for the same data, because the order of data in the intermediate state can change. This does not, however, affect the ingestion of this data.
+:::
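+
+For example, a minimal sketch of the State/Merge round-trip using `uniq`:
+
+```sql
+-- uniqState produces an intermediate AggregateFunction(uniq, UInt64) state;
+-- uniqMerge finishes the aggregation from such states:
+SELECT uniqMerge(state)
+FROM (SELECT uniqState(number) AS state FROM numbers(10));
+-- Result: 10
+```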
+
To work with these states, use:
- [AggregatingMergeTree](../../engines/table-engines/mergetree-family/aggregatingmergetree.md) table engine.
diff --git a/docs/en/sql-reference/aggregate-functions/index.md b/docs/en/sql-reference/aggregate-functions/index.md
index 8951ac4ee6a..5d2229fbcce 100644
--- a/docs/en/sql-reference/aggregate-functions/index.md
+++ b/docs/en/sql-reference/aggregate-functions/index.md
@@ -4,7 +4,7 @@ sidebar_label: Aggregate Functions
sidebar_position: 33
---
-# Aggregate Functions
+# Aggregate Functions
Aggregate functions work in the [normal](http://www.sql-tutorial.com/sql-aggregate-functions-sql-tutorial) way as expected by database experts.
@@ -72,3 +72,16 @@ FROM t_null_big
│ 2.3333333333333335 │ 1.4 │
└────────────────────┴─────────────────────┘
```
+
+You can also use [Tuple](/docs/en/sql-reference/data-types/tuple.md) to work around the NULL-skipping behavior. A `Tuple` that contains only a `NULL` value is not `NULL`, so the aggregate functions won't skip that row because of the `NULL` value.
+
+```sql
+SELECT
+ groupArray(y),
+ groupArray(tuple(y)).1
+FROM t_null_big;
+
+┌─groupArray(y)─┬─tupleElement(groupArray(tuple(y)), 1)─┐
+│ [2,2,3] │ [2,NULL,2,3,NULL] │
+└───────────────┴───────────────────────────────────────┘
+```
diff --git a/docs/en/sql-reference/aggregate-functions/reference/argmax.md b/docs/en/sql-reference/aggregate-functions/reference/argmax.md
index 65c43ab04c0..8f10318838b 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/argmax.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/argmax.md
@@ -6,6 +6,7 @@ sidebar_position: 106
# argMax
Calculates the `arg` value for a maximum `val` value. If there are several different values of `arg` for maximum values of `val`, returns the first of these values encountered.
+Both parts, the `arg` and the `max`, behave as [aggregate functions](/docs/en/sql-reference/aggregate-functions/index.md); they both [skip `Null`](/docs/en/sql-reference/aggregate-functions/index.md#null-processing) during processing and return non-`Null` values if non-`Null` values are available.
**Syntax**
@@ -49,3 +50,60 @@ Result:
│ director │
└──────────────────────┘
```
+
+**Extended example**
+
+```sql
+CREATE TABLE test
+(
+ a Nullable(String),
+ b Nullable(Int64)
+)
+ENGINE = Memory AS
+SELECT *
+FROM VALUES(('a', 1), ('b', 2), ('c', 2), (NULL, 3), (NULL, NULL), ('d', NULL));
+
+select * from test;
+┌─a────┬────b─┐
+│ a │ 1 │
+│ b │ 2 │
+│ c │ 2 │
+│ ᴺᵁᴸᴸ │ 3 │
+│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │
+│ d │ ᴺᵁᴸᴸ │
+└──────┴──────┘
+
+SELECT argMax(a, b), max(b) FROM test;
+┌─argMax(a, b)─┬─max(b)─┐
+│ b            │      3 │ -- argMax = 'b' because it is the first non-Null value; max(b) is from another row!
+└──────────────┴────────┘
+
+SELECT argMax(tuple(a), b) FROM test;
+┌─argMax(tuple(a), b)─┐
+│ (NULL)              │ -- A `Tuple` that contains only a `NULL` value is not `NULL`, so the aggregate functions won't skip that row because of the `NULL` value
+└─────────────────────┘
+
+SELECT (argMax((a, b), b) as t).1 argMaxA, t.2 argMaxB FROM test;
+┌─argMaxA─┬─argMaxB─┐
+│ ᴺᵁᴸᴸ    │       3 │ -- you can use Tuple and get both (all - tuple(*)) columns for the corresponding max(b)
+└─────────┴─────────┘
+
+SELECT argMax(a, b), max(b) FROM test WHERE a IS NULL AND b IS NULL;
+┌─argMax(a, b)─┬─max(b)─┐
+│ ᴺᵁᴸᴸ         │   ᴺᵁᴸᴸ │ -- All aggregated rows contain at least one `NULL` value because of the filter, so all rows are skipped; therefore the result will be `NULL`
+└──────────────┴────────┘
+
+SELECT argMax(a, (b,a)) FROM test;
+┌─argMax(a, tuple(b, a))─┐
+│ c                      │ -- There are two rows with b=2; `Tuple` in the `Max` allows getting an `arg` other than the first
+└────────────────────────┘
+
+SELECT argMax(a, tuple(b)) FROM test;
+┌─argMax(a, tuple(b))─┐
+│ b                   │ -- `Tuple` can be used in `Max` so that `Max` does not skip Nulls
+└─────────────────────┘
+```
+
+**See also**
+
+- [Tuple](/docs/en/sql-reference/data-types/tuple.md)
diff --git a/docs/en/sql-reference/aggregate-functions/reference/argmin.md b/docs/en/sql-reference/aggregate-functions/reference/argmin.md
index a7c21e3f15b..fdfce0833e0 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/argmin.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/argmin.md
@@ -6,6 +6,7 @@ sidebar_position: 105
# argMin
Calculates the `arg` value for a minimum `val` value. If there are several different values of `arg` for minimum values of `val`, returns the first of these values encountered.
+Both parts, the `arg` and the `min`, behave as [aggregate functions](/docs/en/sql-reference/aggregate-functions/index.md); they both [skip `Null`](/docs/en/sql-reference/aggregate-functions/index.md#null-processing) during processing and return non-`Null` values if non-`Null` values are available.
**Syntax**
@@ -49,3 +50,65 @@ Result:
│ worker │
└──────────────────────┘
```
+
+**Extended example**
+
+```sql
+CREATE TABLE test
+(
+ a Nullable(String),
+ b Nullable(Int64)
+)
+ENGINE = Memory AS
+SELECT *
+FROM VALUES((NULL, 0), ('a', 1), ('b', 2), ('c', 2), (NULL, NULL), ('d', NULL));
+
+select * from test;
+┌─a────┬────b─┐
+│ ᴺᵁᴸᴸ │ 0 │
+│ a │ 1 │
+│ b │ 2 │
+│ c │ 2 │
+│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │
+│ d │ ᴺᵁᴸᴸ │
+└──────┴──────┘
+
+SELECT argMin(a, b), min(b) FROM test;
+┌─argMin(a, b)─┬─min(b)─┐
+│ a            │      0 │ -- argMin = 'a' because it is the first non-`NULL` value; min(b) is from another row!
+└──────────────┴────────┘
+
+SELECT argMin(tuple(a), b) FROM test;
+┌─argMin(tuple(a), b)─┐
+│ (NULL)              │ -- A `Tuple` that contains only a `NULL` value is not `NULL`, so the aggregate functions won't skip that row because of the `NULL` value
+└─────────────────────┘
+
+SELECT (argMin((a, b), b) as t).1 argMinA, t.2 argMinB from test;
+┌─argMinA─┬─argMinB─┐
+│ ᴺᵁᴸᴸ    │       0 │ -- you can use `Tuple` and get both (all - tuple(*)) columns for the corresponding min(b)
+└─────────┴─────────┘
+
+SELECT argMin(a, b), min(b) FROM test WHERE a IS NULL and b IS NULL;
+┌─argMin(a, b)─┬─min(b)─┐
+│ ᴺᵁᴸᴸ         │   ᴺᵁᴸᴸ │ -- All aggregated rows contain at least one `NULL` value because of the filter, so all rows are skipped; therefore the result will be `NULL`
+└──────────────┴────────┘
+
+SELECT argMin(a, (b, a)), min(tuple(b, a)) FROM test;
+┌─argMin(a, tuple(b, a))─┬─min(tuple(b, a))─┐
+│ d                      │ (NULL,NULL)      │ -- 'd' is the first non-`NULL` value for the min
+└────────────────────────┴──────────────────┘
+
+SELECT argMin((a, b), (b, a)), min(tuple(b, a)) FROM test;
+┌─argMin(tuple(a, b), tuple(b, a))─┬─min(tuple(b, a))─┐
+│ (NULL,NULL)                      │ (NULL,NULL)      │ -- argMin returns (NULL,NULL) here because `Tuple` allows it not to skip `NULL`, and min(tuple(b, a)) in this case is the minimal value for this dataset
+└──────────────────────────────────┴──────────────────┘
+
+SELECT argMin(a, tuple(b)) FROM test;
+┌─argMin(a, tuple(b))─┐
+│ d                   │ -- `Tuple` can be used in `min` so that rows where `b` is `NULL` are not skipped
+└─────────────────────┘
+```
+
+**See also**
+
+- [Tuple](/docs/en/sql-reference/data-types/tuple.md)
diff --git a/docs/en/sql-reference/aggregate-functions/reference/first_value.md b/docs/en/sql-reference/aggregate-functions/reference/first_value.md
index f343ca3f66c..c1965b23fe3 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/first_value.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/first_value.md
@@ -6,24 +6,32 @@ sidebar_position: 7
# first_value
Selects the first encountered value, similar to `any`, but could accept NULL.
+It should mostly be used with [Window Functions](../../window-functions/index.md).
+Without Window Functions, the result will be random if the source stream is not ordered.
## examples
```sql
-insert into test_data (a,b) values (1,null), (2,3), (4, 5), (6,null)
+CREATE TABLE test_data
+(
+ a Int64,
+ b Nullable(Int64)
+)
+ENGINE = Memory;
+
+INSERT INTO test_data (a, b) Values (1,null), (2,3), (4, 5), (6,null);
```
### example1
The NULL value is ignored by default.
```sql
-select first_value(b) from test_data
+select first_value(b) from test_data;
```
```text
┌─first_value_ignore_nulls(b)─┐
│ 3 │
└─────────────────────────────┘
-
```
### example2
@@ -36,7 +44,6 @@ select first_value(b) ignore nulls from test_data
┌─first_value_ignore_nulls(b)─┐
│ 3 │
└─────────────────────────────┘
-
```
### example3
@@ -46,10 +53,28 @@ select first_value(b) respect nulls from test_data
```
```text
-
┌─first_value_respect_nulls(b)─┐
│ ᴺᵁᴸᴸ │
└──────────────────────────────┘
```
+### example4
+Stabilized result using a sub-query with `ORDER BY`.
+```sql
+SELECT
+ first_value_respect_nulls(b),
+ first_value(b)
+FROM
+(
+ SELECT *
+ FROM test_data
+ ORDER BY a ASC
+)
+```
+
+```text
+┌─first_value_respect_nulls(b)─┬─first_value(b)─┐
+│ ᴺᵁᴸᴸ │ 3 │
+└──────────────────────────────┴────────────────┘
+```
diff --git a/docs/en/sql-reference/aggregate-functions/reference/index.md b/docs/en/sql-reference/aggregate-functions/reference/index.md
index 17ef494e9ad..6c56aefd51d 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/index.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/index.md
@@ -19,8 +19,19 @@ Standard aggregate functions:
- [stddevSamp](/docs/en/sql-reference/aggregate-functions/reference/stddevsamp.md)
- [varPop](/docs/en/sql-reference/aggregate-functions/reference/varpop.md)
- [varSamp](/docs/en/sql-reference/aggregate-functions/reference/varsamp.md)
+- [corr](./corr.md)
- [covarPop](/docs/en/sql-reference/aggregate-functions/reference/covarpop.md)
- [covarSamp](/docs/en/sql-reference/aggregate-functions/reference/covarsamp.md)
+- [entropy](./entropy.md)
+- [exponentialMovingAverage](./exponentialmovingaverage.md)
+- [intervalLengthSum](./intervalLengthSum.md)
+- [kolmogorovSmirnovTest](./kolmogorovsmirnovtest.md)
+- [mannwhitneyutest](./mannwhitneyutest.md)
+- [median](./median.md)
+- [rankCorr](./rankCorr.md)
+- [sumKahan](./sumkahan.md)
+- [studentTTest](./studentttest.md)
+- [welchTTest](./welchttest.md)
ClickHouse-specific aggregate functions:
@@ -34,12 +45,15 @@ ClickHouse-specific aggregate functions:
- [avgWeighted](/docs/en/sql-reference/aggregate-functions/reference/avgweighted.md)
- [topK](/docs/en/sql-reference/aggregate-functions/reference/topk.md)
- [topKWeighted](/docs/en/sql-reference/aggregate-functions/reference/topkweighted.md)
+- [deltaSum](./deltasum.md)
+- [deltaSumTimestamp](./deltasumtimestamp.md)
- [groupArray](/docs/en/sql-reference/aggregate-functions/reference/grouparray.md)
- [groupArrayLast](/docs/en/sql-reference/aggregate-functions/reference/grouparraylast.md)
- [groupUniqArray](/docs/en/sql-reference/aggregate-functions/reference/groupuniqarray.md)
- [groupArrayInsertAt](/docs/en/sql-reference/aggregate-functions/reference/grouparrayinsertat.md)
- [groupArrayMovingAvg](/docs/en/sql-reference/aggregate-functions/reference/grouparraymovingavg.md)
- [groupArrayMovingSum](/docs/en/sql-reference/aggregate-functions/reference/grouparraymovingsum.md)
+- [groupArraySample](./grouparraysample.md)
- [groupBitAnd](/docs/en/sql-reference/aggregate-functions/reference/groupbitand.md)
- [groupBitOr](/docs/en/sql-reference/aggregate-functions/reference/groupbitor.md)
- [groupBitXor](/docs/en/sql-reference/aggregate-functions/reference/groupbitxor.md)
@@ -84,3 +98,9 @@ ClickHouse-specific aggregate functions:
- [theilsU](./theilsu.md)
- [maxIntersections](./maxintersections.md)
- [maxIntersectionsPosition](./maxintersectionsposition.md)
+- [meanZTest](./meanztest.md)
+- [quantileGK](./quantileGK.md)
+- [quantileInterpolatedWeighted](./quantileinterpolatedweighted.md)
+- [sparkBar](./sparkbar.md)
+- [sumCount](./sumcount.md)
+
diff --git a/docs/en/sql-reference/aggregate-functions/reference/last_value.md b/docs/en/sql-reference/aggregate-functions/reference/last_value.md
index 7b6e14e4a55..21a86a5f130 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/last_value.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/last_value.md
@@ -6,12 +6,20 @@ sidebar_position: 8
# last_value
Selects the last encountered value, similar to `anyLast`, but could accept NULL.
-
+It should mostly be used with [Window Functions](../../window-functions/index.md).
+Without Window Functions, the result will be random if the source stream is not ordered.
## examples
```sql
-insert into test_data (a,b) values (1,null), (2,3), (4, 5), (6,null)
+CREATE TABLE test_data
+(
+ a Int64,
+ b Nullable(Int64)
+)
+ENGINE = Memory;
+
+INSERT INTO test_data (a, b) Values (1,null), (2,3), (4, 5), (6,null)
```
### example1
@@ -50,4 +58,24 @@ select last_value(b) respect nulls from test_data
└─────────────────────────────┘
```
+### example4
+Stabilized result using a sub-query with `ORDER BY`.
+```sql
+SELECT
+ last_value_respect_nulls(b),
+ last_value(b)
+FROM
+(
+ SELECT *
+ FROM test_data
+ ORDER BY a ASC
+)
+```
+
+```text
+┌─last_value_respect_nulls(b)─┬─last_value(b)─┐
+│ ᴺᵁᴸᴸ │ 5 │
+└─────────────────────────────┴───────────────┘
+```
+
diff --git a/docs/en/sql-reference/aggregate-functions/reference/summap.md b/docs/en/sql-reference/aggregate-functions/reference/summap.md
index 1acfde3783a..baa25edc250 100644
--- a/docs/en/sql-reference/aggregate-functions/reference/summap.md
+++ b/docs/en/sql-reference/aggregate-functions/reference/summap.md
@@ -5,7 +5,11 @@ sidebar_position: 141
# sumMap
-Syntax: `sumMap(key, value)` or `sumMap(Tuple(key, value))`
+Syntax: `sumMap(key <Array>, value <Array>)` [Array type](../../data-types/array.md) or `sumMap(Tuple(key <Array>, value <Array>))` [Tuple type](../../data-types/tuple.md).
+
+Alias: `sumMappedArrays`.
Totals the `value` array according to the keys specified in the `key` array.
@@ -27,6 +31,7 @@ CREATE TABLE sum_map(
),
statusMapTuple Tuple(Array(Int32), Array(Int32))
) ENGINE = Log;
+
INSERT INTO sum_map VALUES
('2000-01-01', '2000-01-01 00:00:00', [1, 2, 3], [10, 10, 10], ([1, 2, 3], [10, 10, 10])),
('2000-01-01', '2000-01-01 00:00:00', [3, 4, 5], [10, 10, 10], ([3, 4, 5], [10, 10, 10])),
@@ -47,3 +52,7 @@ GROUP BY timeslot
│ 2000-01-01 00:01:00 │ ([4,5,6,7,8],[10,10,20,10,10]) │ ([4,5,6,7,8],[10,10,20,10,10]) │
└─────────────────────┴──────────────────────────────────────────────┴────────────────────────────────┘
```
+
+**See Also**
+
+- [-Map combinator for Map datatype](../combinators.md#-map)
diff --git a/docs/en/sql-reference/data-types/datetime64.md b/docs/en/sql-reference/data-types/datetime64.md
index 2d4035831fa..793691850b1 100644
--- a/docs/en/sql-reference/data-types/datetime64.md
+++ b/docs/en/sql-reference/data-types/datetime64.md
@@ -63,7 +63,7 @@ SELECT * FROM dt WHERE timestamp = toDateTime64('2019-01-01 00:00:00', 3, 'Asia/
``` text
┌───────────────timestamp─┬─event_id─┐
-│ 2019-01-01 00:00:00.000 │ 2 │
+│ 2019-01-01 00:00:00.000 │ 3 │
└─────────────────────────┴──────────┘
```
@@ -75,8 +75,8 @@ SELECT * FROM dt WHERE timestamp = toDateTime64(1546300800.123, 3);
``` text
┌───────────────timestamp─┬─event_id─┐
-│ 2019-01-01 00:00:00.123 │ 1 │
-│ 2019-01-01 00:00:00.123 │ 2 │
+│ 2019-01-01 03:00:00.123 │ 1 │
+│ 2019-01-01 03:00:00.123 │ 2 │
└─────────────────────────┴──────────┘
```
@@ -91,7 +91,7 @@ SELECT toDateTime64(now(), 3, 'Asia/Istanbul') AS column, toTypeName(column) AS
``` text
┌──────────────────column─┬─x──────────────────────────────┐
-│ 2019-10-16 04:12:04.000 │ DateTime64(3, 'Asia/Istanbul') │
+│ 2023-06-05 00:09:52.000 │ DateTime64(3, 'Asia/Istanbul') │
└─────────────────────────┴────────────────────────────────┘
```
@@ -100,13 +100,14 @@ SELECT toDateTime64(now(), 3, 'Asia/Istanbul') AS column, toTypeName(column) AS
``` sql
SELECT
toDateTime64(timestamp, 3, 'Europe/London') as lon_time,
-toDateTime64(timestamp, 3, 'Asia/Istanbul') as mos_time
+toDateTime64(timestamp, 3, 'Asia/Istanbul') as istanbul_time
FROM dt;
```
``` text
-┌───────────────lon_time──┬────────────────mos_time─┐
-│ 2019-01-01 00:00:00.000 │ 2019-01-01 03:00:00.000 │
+┌────────────────lon_time─┬───────────istanbul_time─┐
+│ 2019-01-01 00:00:00.123 │ 2019-01-01 03:00:00.123 │
+│ 2019-01-01 00:00:00.123 │ 2019-01-01 03:00:00.123 │
│ 2018-12-31 21:00:00.000 │ 2019-01-01 00:00:00.000 │
└─────────────────────────┴─────────────────────────┘
```
@@ -115,10 +116,9 @@ FROM dt;
- [Type conversion functions](../../sql-reference/functions/type-conversion-functions.md)
- [Functions for working with dates and times](../../sql-reference/functions/date-time-functions.md)
-- [Functions for working with arrays](../../sql-reference/functions/array-functions.md)
-- [The `date_time_input_format` setting](../../operations/settings/settings.md#settings-date_time_input_format)
-- [The `date_time_output_format` setting](../../operations/settings/settings.md#settings-date_time_output_format)
+- [The `date_time_input_format` setting](../../operations/settings/settings-formats.md#date_time_input_format)
+- [The `date_time_output_format` setting](../../operations/settings/settings-formats.md#date_time_output_format)
- [The `timezone` server configuration parameter](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-timezone)
-- [Operators for working with dates and times](../../sql-reference/operators/index.md#operators-datetime)
+- [Operators for working with dates and times](../../sql-reference/operators/index.md#operators-for-working-with-dates-and-times)
- [`Date` data type](../../sql-reference/data-types/date.md)
- [`DateTime` data type](../../sql-reference/data-types/datetime.md)
diff --git a/docs/en/sql-reference/data-types/decimal.md b/docs/en/sql-reference/data-types/decimal.md
index 8df8b2519e3..bba5ea74ebe 100644
--- a/docs/en/sql-reference/data-types/decimal.md
+++ b/docs/en/sql-reference/data-types/decimal.md
@@ -32,7 +32,7 @@ For example, Decimal32(4) can contain numbers from -99999.9999 to 99999.9999 wit
Internally data is represented as normal signed integers with respective bit width. Real value ranges that can be stored in memory are a bit larger than specified above, which are checked only on conversion from a string.
-Because modern CPUs do not support 128-bit integers natively, operations on Decimal128 are emulated. Because of this Decimal128 works significantly slower than Decimal32/Decimal64.
+Because modern CPUs do not support 128-bit and 256-bit integers natively, operations on Decimal128 and Decimal256 are emulated. Thus, Decimal128 and Decimal256 work significantly slower than Decimal32/Decimal64.
## Operations and Result Type
@@ -59,6 +59,10 @@ Some functions on Decimal return result as Float64 (for example, var or stddev).
During calculations on Decimal, integer overflows might happen. Excessive digits in a fraction are discarded (not rounded). Excessive digits in integer part will lead to an exception.
+:::warning
+Overflow checks are not implemented for Decimal128 and Decimal256. In case of overflow, an incorrect result is returned; no exception is thrown.
+:::
+
``` sql
SELECT toDecimal32(2, 4) AS x, x / 3
```
diff --git a/docs/en/sql-reference/data-types/index.md b/docs/en/sql-reference/data-types/index.md
index 508307a0543..ffd063590fa 100644
--- a/docs/en/sql-reference/data-types/index.md
+++ b/docs/en/sql-reference/data-types/index.md
@@ -28,6 +28,6 @@ ClickHouse data types include:
- **Nested data structures**: A [`Nested` data structure](./nested-data-structures/index.md) is like a table inside a cell
- **Tuples**: A [`Tuple` of elements](./tuple.md), each having an individual type.
- **Nullable**: [`Nullable`](./nullable.md) allows you to store a value as `NULL` when a value is "missing" (instead of the column settings its default value for the data type)
-- **IP addresses**: use [`IPv4`](./domains/ipv4.md) and [`IPv6`](./domains/ipv6.md) to efficiently store IP addresses
+- **IP addresses**: use [`IPv4`](./ipv4.md) and [`IPv6`](./ipv6.md) to efficiently store IP addresses
- **Geo types**: for [geographical data](./geo.md), including `Point`, `Ring`, `Polygon` and `MultiPolygon`
- **Special data types**: including [`Expression`](./special-data-types/expression.md), [`Set`](./special-data-types/set.md), [`Nothing`](./special-data-types/nothing.md) and [`Interval`](./special-data-types/interval.md)
diff --git a/docs/en/sql-reference/data-types/domains/ipv4.md b/docs/en/sql-reference/data-types/ipv4.md
similarity index 60%
rename from docs/en/sql-reference/data-types/domains/ipv4.md
rename to docs/en/sql-reference/data-types/ipv4.md
index b34814211fc..288806f47b3 100644
--- a/docs/en/sql-reference/data-types/domains/ipv4.md
+++ b/docs/en/sql-reference/data-types/ipv4.md
@@ -1,12 +1,12 @@
---
-slug: /en/sql-reference/data-types/domains/ipv4
+slug: /en/sql-reference/data-types/ipv4
sidebar_position: 59
sidebar_label: IPv4
---
## IPv4
-`IPv4` is a domain based on `UInt32` type and serves as a typed replacement for storing IPv4 values. It provides compact storage with the human-friendly input-output format and column type information on inspection.
+IPv4 addresses. Stored in 4 bytes as UInt32.
### Basic Usage
@@ -57,25 +57,6 @@ SELECT toTypeName(from), hex(from) FROM hits LIMIT 1;
└──────────────────┴───────────┘
```
-Domain values are not implicitly convertible to types other than `UInt32`.
-If you want to convert `IPv4` value to a string, you have to do that explicitly with `IPv4NumToString()` function:
+**See Also**
-``` sql
-SELECT toTypeName(s), IPv4NumToString(from) as s FROM hits LIMIT 1;
-```
-
- ┌─toTypeName(IPv4NumToString(from))─┬─s──────────────┐
- │ String │ 183.247.232.58 │
- └───────────────────────────────────┴────────────────┘
-
-Or cast to a `UInt32` value:
-
-``` sql
-SELECT toTypeName(i), CAST(from as UInt32) as i FROM hits LIMIT 1;
-```
-
-``` text
-┌─toTypeName(CAST(from, 'UInt32'))─┬──────────i─┐
-│ UInt32 │ 3086477370 │
-└──────────────────────────────────┴────────────┘
-```
+- [Functions for Working with IPv4 and IPv6 Addresses](../functions/ip-address-functions.md)
diff --git a/docs/en/sql-reference/data-types/domains/ipv6.md b/docs/en/sql-reference/data-types/ipv6.md
similarity index 61%
rename from docs/en/sql-reference/data-types/domains/ipv6.md
rename to docs/en/sql-reference/data-types/ipv6.md
index dcb22e3cb6d..97959308b58 100644
--- a/docs/en/sql-reference/data-types/domains/ipv6.md
+++ b/docs/en/sql-reference/data-types/ipv6.md
@@ -1,12 +1,12 @@
---
-slug: /en/sql-reference/data-types/domains/ipv6
+slug: /en/sql-reference/data-types/ipv6
sidebar_position: 60
sidebar_label: IPv6
---
## IPv6
-`IPv6` is a domain based on `FixedString(16)` type and serves as a typed replacement for storing IPv6 values. It provides compact storage with the human-friendly input-output format and column type information on inspection.
+IPv6 addresses. Stored in 16 bytes as UInt128 big-endian.
### Basic Usage
@@ -57,27 +57,6 @@ SELECT toTypeName(from), hex(from) FROM hits LIMIT 1;
└──────────────────┴──────────────────────────────────┘
```
-Domain values are not implicitly convertible to types other than `FixedString(16)`.
-If you want to convert `IPv6` value to a string, you have to do that explicitly with `IPv6NumToString()` function:
+**See Also**
-``` sql
-SELECT toTypeName(s), IPv6NumToString(from) as s FROM hits LIMIT 1;
-```
-
-``` text
-┌─toTypeName(IPv6NumToString(from))─┬─s─────────────────────────────┐
-│ String │ 2001:44c8:129:2632:33:0:252:2 │
-└───────────────────────────────────┴───────────────────────────────┘
-```
-
-Or cast to a `FixedString(16)` value:
-
-``` sql
-SELECT toTypeName(i), CAST(from as FixedString(16)) as i FROM hits LIMIT 1;
-```
-
-``` text
-┌─toTypeName(CAST(from, 'FixedString(16)'))─┬─i───────┐
-│ FixedString(16) │ ��� │
-└───────────────────────────────────────────┴─────────┘
-```
+- [Functions for Working with IPv4 and IPv6 Addresses](../functions/ip-address-functions.md)
diff --git a/docs/en/sql-reference/data-types/map.md b/docs/en/sql-reference/data-types/map.md
index 0ea183d73d8..e0c8b98f9f8 100644
--- a/docs/en/sql-reference/data-types/map.md
+++ b/docs/en/sql-reference/data-types/map.md
@@ -108,6 +108,7 @@ Result:
- [map()](../../sql-reference/functions/tuple-map-functions.md#function-map) function
- [CAST()](../../sql-reference/functions/type-conversion-functions.md#type_conversion_function-cast) function
+- [-Map combinator for Map datatype](../aggregate-functions/combinators.md#-map)
## Related content
diff --git a/docs/en/sql-reference/dictionaries/index.md b/docs/en/sql-reference/dictionaries/index.md
index 43e9300c1ae..6c3d80683db 100644
--- a/docs/en/sql-reference/dictionaries/index.md
+++ b/docs/en/sql-reference/dictionaries/index.md
@@ -2280,7 +2280,7 @@ This config consists of a list of regular expression tree nodes. Each node has t
- The value of an attribute may contain **back references**, referring to capture groups of the matched regular expression. In the example, the value of attribute `version` in the first node consists of a back-reference `\1` to capture group `(\d+[\.\d]*)` in the regular expression. Back-reference numbers range from 1 to 9 and are written as `$1` or `\1` (for number 1). The back reference is replaced by the matched capture group during query execution.
- **child nodes**: a list of children of a regexp tree node, each of which has its own attributes and (potentially) children nodes. String matching proceeds in a depth-first fashion. If a string matches a regexp node, the dictionary checks if it also matches the nodes' child nodes. If that is the case, the attributes of the deepest matching node are assigned. Attributes of a child node overwrite equally named attributes of parent nodes. The name of child nodes in YAML files can be arbitrary, e.g. `versions` in above example.
-Regexp tree dictionaries only allow access using the functions `dictGet` and `dictGetOrDefault`.
+Regexp tree dictionaries only allow access using the functions `dictGet`, `dictGetOrDefault`, and `dictGetAll`.
Example:
@@ -2300,6 +2300,67 @@ In this case, we first match the regular expression `\d+/tclwebkit(?:\d+[\.\d]*)
With a powerful YAML configuration file, we can use a regexp tree dictionary as a user agent string parser. We support [uap-core](https://github.com/ua-parser/uap-core) and demonstrate how to use it in the functional test [02504_regexp_dictionary_ua_parser](https://github.com/ClickHouse/ClickHouse/blob/master/tests/queries/0_stateless/02504_regexp_dictionary_ua_parser.sh).
+#### Collecting Attribute Values
+
+Sometimes it is useful to return values from multiple regular expressions that matched, rather than just the value of a leaf node. In these cases, the specialized [`dictGetAll`](../../sql-reference/functions/ext-dict-functions.md#dictgetall) function can be used. If a node has an attribute value of type `T`, `dictGetAll` will return an `Array(T)` containing zero or more values.
+
+By default, the number of matches returned per key is unbounded. A bound can be passed as an optional fourth argument to `dictGetAll`. The array is populated in _topological order_, meaning that child nodes come before parent nodes, and sibling nodes follow the ordering in the source.
+
+Example:
+
+```sql
+CREATE DICTIONARY regexp_dict
+(
+ regexp String,
+ tag String,
+ topological_index Int64,
+ captured Nullable(String),
+ parent String
+)
+PRIMARY KEY(regexp)
+SOURCE(YAMLRegExpTree(PATH '/var/lib/clickhouse/user_files/regexp_tree.yaml'))
+LAYOUT(regexp_tree)
+LIFETIME(0)
+```
+
+```yaml
+# /var/lib/clickhouse/user_files/regexp_tree.yaml
+- regexp: 'clickhouse\.com'
+ tag: 'ClickHouse'
+ topological_index: 1
+ paths:
+ - regexp: 'clickhouse\.com/docs(.*)'
+ tag: 'ClickHouse Documentation'
+ topological_index: 0
+ captured: '\1'
+ parent: 'ClickHouse'
+
+- regexp: '/docs(/|$)'
+ tag: 'Documentation'
+ topological_index: 2
+
+- regexp: 'github.com'
+ tag: 'GitHub'
+ topological_index: 3
+ captured: 'NULL'
+```
+
+```sql
+CREATE TABLE urls (url String) ENGINE=MergeTree ORDER BY url;
+INSERT INTO urls VALUES ('clickhouse.com'), ('clickhouse.com/docs/en'), ('github.com/clickhouse/tree/master/docs');
+SELECT url, dictGetAll('regexp_dict', ('tag', 'topological_index', 'captured', 'parent'), url, 2) FROM urls;
+```
+
+Result:
+
+```text
+┌─url────────────────────────────────────┬─dictGetAll('regexp_dict', ('tag', 'topological_index', 'captured', 'parent'), url, 2)─┐
+│ clickhouse.com │ (['ClickHouse'],[1],[],[]) │
+│ clickhouse.com/docs/en │ (['ClickHouse Documentation','ClickHouse'],[0,1],['/en'],['ClickHouse']) │
+│ github.com/clickhouse/tree/master/docs │ (['Documentation','GitHub'],[2,3],[NULL],[]) │
+└────────────────────────────────────────┴───────────────────────────────────────────────────────────────────────────────────────┘
+```
+
### Use Regular Expression Tree Dictionary in ClickHouse Cloud
The `YAMLRegExpTree` source used above works in ClickHouse Open Source but not in ClickHouse Cloud. To use regexp tree dictionaries in ClickHouse Cloud, first create a regexp tree dictionary from a YAML file locally in ClickHouse Open Source, then dump this dictionary into a CSV file using the `dictionary` table function and the [INTO OUTFILE](../statements/select/into-outfile.md) clause.
diff --git a/docs/en/sql-reference/functions/array-functions.md b/docs/en/sql-reference/functions/array-functions.md
index bdd1445c990..7f2b8f3c605 100644
--- a/docs/en/sql-reference/functions/array-functions.md
+++ b/docs/en/sql-reference/functions/array-functions.md
@@ -230,13 +230,15 @@ hasAll(set, subset)
**Arguments**
- `set` – Array of any type with a set of elements.
-- `subset` – Array of any type with elements that should be tested to be a subset of `set`.
+- `subset` – Array of any type that shares a common supertype with `set`, containing elements that should be tested to be a subset of `set`.
**Return values**
- `1`, if `set` contains all of the elements from `subset`.
- `0`, otherwise.
+Raises a `NO_COMMON_TYPE` exception if the `set` and `subset` elements do not share a common supertype.
+
**Peculiar properties**
- An empty array is a subset of any array.
@@ -253,7 +255,7 @@ hasAll(set, subset)
`SELECT hasAll(['a', 'b'], ['a'])` returns 1.
-`SELECT hasAll([1], ['a'])` returns 0.
+`SELECT hasAll([1], ['a'])` raises a `NO_COMMON_TYPE` exception.
`SELECT hasAll([[1, 2], [3, 4]], [[1, 2], [3, 5]])` returns 0.
@@ -268,13 +270,15 @@ hasAny(array1, array2)
**Arguments**
- `array1` – Array of any type with a set of elements.
-- `array2` – Array of any type with a set of elements.
+- `array2` – Array of any type that shares a common supertype with `array1`.
**Return values**
- `1`, if `array1` and `array2` have one similar element at least.
- `0`, otherwise.
+Raises a `NO_COMMON_TYPE` exception if the `array1` and `array2` elements do not share a common supertype.
+
**Peculiar properties**
- `Null` processed as a value.
@@ -288,7 +292,7 @@ hasAny(array1, array2)
`SELECT hasAny([-128, 1., 512], [1])` returns `1`.
-`SELECT hasAny([[1, 2], [3, 4]], ['a', 'c'])` returns `0`.
+`SELECT hasAny([[1, 2], [3, 4]], ['a', 'c'])` raises a `NO_COMMON_TYPE` exception.
`SELECT hasAll([[1, 2], [3, 4]], [[1, 2], [1, 2]])` returns `1`.
@@ -318,6 +322,8 @@ For Example:
- `1`, if `array1` contains `array2`.
- `0`, otherwise.
+Raises a `NO_COMMON_TYPE` exception if the `array1` and `array2` elements do not share a common supertype.
+
**Peculiar properties**
- The function will return `1` if `array2` is empty.
@@ -339,6 +345,9 @@ For Example:
`SELECT hasSubstr(['a', 'b' , 'c'], ['a', 'c'])` returns 0.
`SELECT hasSubstr([[1, 2], [3, 4], [5, 6]], [[1, 2], [3, 4]])` returns 1.
+
+`SELECT hasSubstr([1, 2, NULL, 3, 4], ['a'])` raises a `NO_COMMON_TYPE` exception.
+
## indexOf(arr, x)
diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md
index 280b41e7a5f..3f61e7a214d 100644
--- a/docs/en/sql-reference/functions/date-time-functions.md
+++ b/docs/en/sql-reference/functions/date-time-functions.md
@@ -139,8 +139,8 @@ makeDateTime32(year, month, day, hour, minute, second[, fraction[, precision[, t
## timeZone
-Returns the timezone of the server.
-If the function is executed in the context of a distributed table, it generates a normal column with values relevant to each shard, otherwise it produces a constant value.
+Returns the timezone of the current session, i.e. the value of setting [session_timezone](../../operations/settings/settings.md#session_timezone).
+If the function is executed in the context of a distributed table, then it generates a normal column with values relevant to each shard, otherwise it produces a constant value.
**Syntax**
@@ -156,6 +156,33 @@ Alias: `timezone`.
Type: [String](../../sql-reference/data-types/string.md).
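+
+**Example**
+
+A minimal usage example; the returned value depends on the [session_timezone](../../operations/settings/settings.md#session_timezone) setting, and `Europe/Amsterdam` below is only an illustration.
+
+``` sql
+SELECT timeZone()
+```
+
+Result:
+
+```response
+┌─timeZone()───────┐
+│ Europe/Amsterdam │
+└──────────────────┘
+```
+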
+**See also**
+
+- [serverTimeZone](#serverTimeZone)
+
+## serverTimeZone
+
+Returns the timezone of the server, i.e. the value of setting [timezone](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-timezone).
+If the function is executed in the context of a distributed table, then it generates a normal column with values relevant to each shard. Otherwise, it produces a constant value.
+
+**Syntax**
+
+``` sql
+serverTimeZone()
+```
+
+Alias: `serverTimezone`.
+
+**Returned value**
+
+- Timezone.
+
+Type: [String](../../sql-reference/data-types/string.md).
+
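+**Example**
+
+A minimal usage example; the returned value depends on the server's [timezone](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-timezone) setting, and `UTC` below is only an illustration.
+
+``` sql
+SELECT serverTimeZone()
+```
+
+Result:
+
+```response
+┌─serverTimeZone()─┐
+│ UTC              │
+└──────────────────┘
+```
+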
+**See also**
+
+- [timeZone](#timeZone)
+
## toTimeZone
Converts a date or date with time to the specified time zone. Does not change the internal value (number of unix seconds) of the data, only the value's time zone attribute and the value's string representation changes.
diff --git a/docs/en/sql-reference/functions/distance-functions.md b/docs/en/sql-reference/functions/distance-functions.md
index 67affb88a53..1774c22014d 100644
--- a/docs/en/sql-reference/functions/distance-functions.md
+++ b/docs/en/sql-reference/functions/distance-functions.md
@@ -237,6 +237,43 @@ Result:
└────────────────────────────┘
```
+## L2SquaredDistance
+
+Calculates the sum of the squares of the differences between the corresponding elements of two vectors.
+
+**Syntax**
+
+```sql
+L2SquaredDistance(vector1, vector2)
+```
+
+Alias: `distanceL2Squared`.
+
+**Arguments**
+
+- `vector1` — First vector. [Tuple](../../sql-reference/data-types/tuple.md) or [Array](../../sql-reference/data-types/array.md).
+- `vector2` — Second vector. [Tuple](../../sql-reference/data-types/tuple.md) or [Array](../../sql-reference/data-types/array.md).
+
+**Returned value**
+
+Type: [Float](../../sql-reference/data-types/float.md).
+
+**Example**
+
+Query:
+
+```sql
+SELECT L2SquaredDistance([1, 2, 3], [0, 0, 0])
+```
+
+Result:
+
+```response
+┌─L2SquaredDistance([1, 2, 3], [0, 0, 0])─┐
+│ 14 │
+└─────────────────────────────────────────┘
+```
+
## LinfDistance
Calculates the distance between two points (the values of the vectors are the coordinates) in `L_{inf}` space ([maximum norm](https://en.wikipedia.org/wiki/Norm_(mathematics)#Maximum_norm_(special_case_of:_infinity_norm,_uniform_norm,_or_supremum_norm))).
diff --git a/docs/en/sql-reference/functions/ext-dict-functions.md b/docs/en/sql-reference/functions/ext-dict-functions.md
index 7d8aa2c0390..284d6d80405 100644
--- a/docs/en/sql-reference/functions/ext-dict-functions.md
+++ b/docs/en/sql-reference/functions/ext-dict-functions.md
@@ -403,6 +403,84 @@ SELECT dictGetDescendants('hierarchy_flat_dictionary', number, 1) FROM system.nu
└────────────────────────────────────────────────────────────┘
```
+
+## dictGetAll
+
+Retrieves the attribute values of all nodes that matched each key in a [regular expression tree dictionary](../../sql-reference/dictionaries/index.md#regexp-tree-dictionary).
+
+Besides returning values of type `Array(T)` instead of `T`, this function behaves similarly to [`dictGet`](#dictget-dictgetordefault-dictgetornull).
+
+**Syntax**
+
+``` sql
+dictGetAll('dict_name', attr_names, id_expr[, limit])
+```
+
+**Arguments**
+
+- `dict_name` — Name of the dictionary. [String literal](../../sql-reference/syntax.md#syntax-string-literal).
+- `attr_names` — Name of the column of the dictionary, [String literal](../../sql-reference/syntax.md#syntax-string-literal), or tuple of column names, [Tuple](../../sql-reference/data-types/tuple.md)([String literal](../../sql-reference/syntax.md#syntax-string-literal)).
+- `id_expr` — Key value. [Expression](../../sql-reference/syntax.md#syntax-expressions) returning a dictionary key-type value or a [Tuple](../../sql-reference/data-types/tuple.md)-type value, depending on the dictionary configuration.
+- `limit` — Maximum length for each value array returned. When truncating, child nodes are given precedence over parent nodes, and otherwise the defined list order for the regexp tree dictionary is respected. If unspecified, array length is unlimited.
+
+**Returned value**
+
+- If ClickHouse successfully parses the attribute as the attribute’s data type defined in the dictionary, it returns an array of dictionary attribute values that correspond to `id_expr` for each attribute specified by `attr_names`.
+
+- If there is no key corresponding to `id_expr` in the dictionary, then an empty array is returned.
+
+ClickHouse throws an exception if it cannot parse the value of the attribute or the value does not match the attribute data type.
+
+**Example**
+
+Consider the following regexp tree dictionary:
+
+```sql
+CREATE DICTIONARY regexp_dict
+(
+ regexp String,
+ tag String
+)
+PRIMARY KEY(regexp)
+SOURCE(YAMLRegExpTree(PATH '/var/lib/clickhouse/user_files/regexp_tree.yaml'))
+LAYOUT(regexp_tree)
+...
+```
+
+```yaml
+# /var/lib/clickhouse/user_files/regexp_tree.yaml
+- regexp: 'foo'
+ tag: 'foo_attr'
+- regexp: 'bar'
+ tag: 'bar_attr'
+- regexp: 'baz'
+ tag: 'baz_attr'
+```
+
+Get all matching values:
+
+```sql
+SELECT dictGetAll('regexp_dict', 'tag', 'foobarbaz');
+```
+
+```text
+┌─dictGetAll('regexp_dict', 'tag', 'foobarbaz')─┐
+│ ['foo_attr','bar_attr','baz_attr'] │
+└───────────────────────────────────────────────┘
+```
+
+Get up to 2 matching values:
+
+```sql
+SELECT dictGetAll('regexp_dict', 'tag', 'foobarbaz', 2);
+```
+
+```text
+┌─dictGetAll('regexp_dict', 'tag', 'foobarbaz', 2)─┐
+│ ['foo_attr','bar_attr'] │
+└──────────────────────────────────────────────────┘
+```
+
## Other Functions
ClickHouse supports specialized functions that convert dictionary attribute values to a specific data type regardless of the dictionary configuration.
diff --git a/docs/en/sql-reference/functions/functions-for-nulls.md b/docs/en/sql-reference/functions/functions-for-nulls.md
index 6f82fedaab7..d57b799e94c 100644
--- a/docs/en/sql-reference/functions/functions-for-nulls.md
+++ b/docs/en/sql-reference/functions/functions-for-nulls.md
@@ -8,7 +8,7 @@ sidebar_label: Nullable
## isNull
-Returns whether the argument is [NULL](../../sql-reference/syntax.md#null-literal).
+Returns whether the argument is [NULL](../../sql-reference/syntax.md#null).
``` sql
isNull(x)
diff --git a/docs/en/sql-reference/functions/index.md b/docs/en/sql-reference/functions/index.md
index 42d402e9d44..d07a5292431 100644
--- a/docs/en/sql-reference/functions/index.md
+++ b/docs/en/sql-reference/functions/index.md
@@ -10,7 +10,9 @@ There are at least\* two types of functions - regular functions (they are just c
In this section we discuss regular functions. For aggregate functions, see the section “Aggregate functions”.
-\* - There is a third type of function that the ‘arrayJoin’ function belongs to; table functions can also be mentioned separately.\*
+:::note
+There is a third type of function that the [‘arrayJoin’ function](/docs/en/sql-reference/functions/array-join.md) belongs to. [Table functions](/docs/en/sql-reference/table-functions/index.md) can also be mentioned separately.
+:::
## Strong Typing
diff --git a/docs/en/sql-reference/functions/ip-address-functions.md b/docs/en/sql-reference/functions/ip-address-functions.md
index 0dc1db1161b..33c788a632e 100644
--- a/docs/en/sql-reference/functions/ip-address-functions.md
+++ b/docs/en/sql-reference/functions/ip-address-functions.md
@@ -248,7 +248,7 @@ SELECT IPv6CIDRToRange(toIPv6('2001:0db8:0000:85a3:0000:0000:ac1f:8001'), 32);
## toIPv4(string)
-An alias to `IPv4StringToNum()` that takes a string form of IPv4 address and returns value of [IPv4](../../sql-reference/data-types/domains/ipv4.md) type, which is binary equal to value returned by `IPv4StringToNum()`.
+An alias to `IPv4StringToNum()` that takes a string form of IPv4 address and returns value of [IPv4](../../sql-reference/data-types/ipv4.md) type, which is binary equal to value returned by `IPv4StringToNum()`.
``` sql
WITH
@@ -296,7 +296,7 @@ Same as `toIPv6`, but if the IPv6 address has an invalid format, it returns null
## toIPv6
-Converts a string form of IPv6 address to [IPv6](../../sql-reference/data-types/domains/ipv6.md) type. If the IPv6 address has an invalid format, returns an empty value.
+Converts a string form of IPv6 address to [IPv6](../../sql-reference/data-types/ipv6.md) type. If the IPv6 address has an invalid format, returns an empty value.
Similar to [IPv6StringToNum](#ipv6stringtonums) function, which converts IPv6 address to binary format.
If the input string contains a valid IPv4 address, then the IPv6 equivalent of the IPv4 address is returned.
@@ -315,7 +315,7 @@ toIPv6(string)
- IP address.
-Type: [IPv6](../../sql-reference/data-types/domains/ipv6.md).
+Type: [IPv6](../../sql-reference/data-types/ipv6.md).
**Examples**
diff --git a/docs/en/sql-reference/functions/nlp-functions.md b/docs/en/sql-reference/functions/nlp-functions.md
index f10415783a5..bb127a939f3 100644
--- a/docs/en/sql-reference/functions/nlp-functions.md
+++ b/docs/en/sql-reference/functions/nlp-functions.md
@@ -4,6 +4,8 @@ sidebar_position: 130
sidebar_label: NLP (experimental)
---
+# Natural Language Processing (NLP) Functions
+
:::note
This is an experimental feature that is currently in development and is not ready for general use. It will change in unpredictable backwards-incompatible ways in future releases. Set `allow_experimental_nlp_functions = 1` to enable it.
:::
diff --git a/docs/en/sql-reference/functions/tuple-functions.md b/docs/en/sql-reference/functions/tuple-functions.md
index 1739920c9f0..7ed2deaeda6 100644
--- a/docs/en/sql-reference/functions/tuple-functions.md
+++ b/docs/en/sql-reference/functions/tuple-functions.md
@@ -22,14 +22,15 @@ tuple(x, y, …)
A function that allows getting a column from a tuple.
-If the second argument is a number `n`, it is the column index, starting from 1. If the second argument is a string `s`, it represents the name of the element. Besides, we can provide the third optional argument, such that when index out of bounds or element for such name does not exist, the default value returned instead of throw exception. The second and third arguments if provided are always must be constant. There is no cost to execute the function.
+If the second argument is a number `index`, it is the column index, starting from 1. If the second argument is a string `name`, it represents the name of the element. In addition, a third optional argument can be provided, such that when the index is out of bounds or no element exists for the name, the default value is returned instead of throwing an exception. The second and third arguments, if provided, must be constants. There is no cost to execute the function.
-The function implements the operator `x.n` and `x.s`.
+The function implements the operators `x.index` and `x.name`.
**Syntax**
``` sql
-tupleElement(tuple, n/s [, default_value])
+tupleElement(tuple, index[, default_value])
+tupleElement(tuple, name[, default_value])
```
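
For example, a sketch of the default-value behavior described above (the values are illustrative):

``` sql
SELECT tupleElement((1, 'a'), 2), tupleElement((1, 'a'), 3, 'z')
```

The first call returns `'a'`; in the second call the index is out of bounds, so the default `'z'` is returned instead of an exception being thrown.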
## untuple
diff --git a/docs/en/sql-reference/functions/type-conversion-functions.md b/docs/en/sql-reference/functions/type-conversion-functions.md
index f6c99b168ac..214c885bc0e 100644
--- a/docs/en/sql-reference/functions/type-conversion-functions.md
+++ b/docs/en/sql-reference/functions/type-conversion-functions.md
@@ -33,7 +33,7 @@ SELECT
toTypeName(toNullable('') AS val) AS source_type,
toTypeName(toString(val)) AS to_type_result_type,
toTypeName(CAST(val, 'String')) AS cast_result_type
-
+
┌─source_type──────┬─to_type_result_type─┬─cast_result_type─┐
│ Nullable(String) │ Nullable(String) │ String │
└──────────────────┴─────────────────────┴──────────────────┘
@@ -203,7 +203,7 @@ Result:
## toDate
-Converts the argument to [Date](/docs/en/sql-reference/data-types/date.md) data type.
+Converts the argument to [Date](/docs/en/sql-reference/data-types/date.md) data type.
If the argument is [DateTime](/docs/en/sql-reference/data-types/datetime.md) or [DateTime64](/docs/en/sql-reference/data-types/datetime64.md), it truncates it and leaves the date component of the DateTime:
@@ -232,7 +232,7 @@ SELECT
│ 2022-12-30 │ Date │
└────────────┴──────────────────────────────────┘
-1 row in set. Elapsed: 0.001 sec.
+1 row in set. Elapsed: 0.001 sec.
```
```sql
@@ -314,20 +314,183 @@ SELECT
└─────────────────────┴───────────────┴─────────────┴─────────────────────┘
```
+
## toDateOrZero
+The same as [toDate](#todate) but returns the lower boundary of [Date](/docs/en/sql-reference/data-types/date.md) if an invalid argument is received. Only a [String](/docs/en/sql-reference/data-types/string.md) argument is supported.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateOrZero('2022-12-30'), toDateOrZero('');
+```
+
+Result:
+
+```response
+┌─toDateOrZero('2022-12-30')─┬─toDateOrZero('')─┐
+│ 2022-12-30 │ 1970-01-01 │
+└────────────────────────────┴──────────────────┘
+```
+
+
## toDateOrNull
+The same as [toDate](#todate) but returns `NULL` if an invalid argument is received. Only a [String](/docs/en/sql-reference/data-types/string.md) argument is supported.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateOrNull('2022-12-30'), toDateOrNull('');
+```
+
+Result:
+
+```response
+┌─toDateOrNull('2022-12-30')─┬─toDateOrNull('')─┐
+│ 2022-12-30 │ ᴺᵁᴸᴸ │
+└────────────────────────────┴──────────────────┘
+```
+
+
## toDateOrDefault
+Like [toDate](#todate) but if unsuccessful, returns a default value which is either the second argument (if specified), or otherwise the lower boundary of [Date](/docs/en/sql-reference/data-types/date.md).
+
+**Syntax**
+
+``` sql
+toDateOrDefault(expr [, default_value])
+```
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateOrDefault('2022-12-30'), toDateOrDefault('', '2023-01-01'::Date);
+```
+
+Result:
+
+```response
+┌─toDateOrDefault('2022-12-30')─┬─toDateOrDefault('', CAST('2023-01-01', 'Date'))─┐
+│ 2022-12-30 │ 2023-01-01 │
+└───────────────────────────────┴─────────────────────────────────────────────────┘
+```
+
+
## toDateTime
+Converts an input value to [DateTime](/docs/en/sql-reference/data-types/datetime.md).
+
+**Syntax**
+
+``` sql
+toDateTime(expr[, time_zone])
+```
+
+**Arguments**
+
+- `expr` — The value. [String](/docs/en/sql-reference/data-types/string.md), [Int](/docs/en/sql-reference/data-types/int-uint.md), [Date](/docs/en/sql-reference/data-types/date.md) or [DateTime](/docs/en/sql-reference/data-types/datetime.md).
+- `time_zone` — Time zone. [String](/docs/en/sql-reference/data-types/string.md).
+
+If `expr` is a number, it is interpreted as the number of seconds since the beginning of the Unix Epoch (i.e. as a Unix timestamp).
+
+**Returned value**
+
+- A date with time. [DateTime](/docs/en/sql-reference/data-types/datetime.md).
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateTime('2022-12-30 13:44:17'), toDateTime(1685457500, 'UTC');
+```
+
+Result:
+
+```response
+┌─toDateTime('2022-12-30 13:44:17')─┬─toDateTime(1685457500, 'UTC')─┐
+│ 2022-12-30 13:44:17 │ 2023-05-30 14:38:20 │
+└───────────────────────────────────┴───────────────────────────────┘
+```
+
+
## toDateTimeOrZero
+The same as [toDateTime](#todatetime) but returns the lower boundary of [DateTime](/docs/en/sql-reference/data-types/datetime.md) if an invalid argument is received. Only a [String](/docs/en/sql-reference/data-types/string.md) argument is supported.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateTimeOrZero('2022-12-30 13:44:17'), toDateTimeOrZero('');
+```
+
+Result:
+
+```response
+┌─toDateTimeOrZero('2022-12-30 13:44:17')─┬─toDateTimeOrZero('')─┐
+│ 2022-12-30 13:44:17 │ 1970-01-01 00:00:00 │
+└─────────────────────────────────────────┴──────────────────────┘
+```
+
+
## toDateTimeOrNull
+The same as [toDateTime](#todatetime) but returns `NULL` if an invalid argument is received. Only a [String](/docs/en/sql-reference/data-types/string.md) argument is supported.
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateTimeOrNull('2022-12-30 13:44:17'), toDateTimeOrNull('');
+```
+
+Result:
+
+```response
+┌─toDateTimeOrNull('2022-12-30 13:44:17')─┬─toDateTimeOrNull('')─┐
+│ 2022-12-30 13:44:17 │ ᴺᵁᴸᴸ │
+└─────────────────────────────────────────┴──────────────────────┘
+```
+
+
## toDateTimeOrDefault
+Like [toDateTime](#todatetime) but if unsuccessful, returns a default value which is either the third argument (if specified), or otherwise the lower boundary of [DateTime](/docs/en/sql-reference/data-types/datetime.md).
+
+**Syntax**
+
+``` sql
+toDateTimeOrDefault(expr [, time_zone [, default_value]])
+```
+
+**Example**
+
+Query:
+
+``` sql
+SELECT toDateTimeOrDefault('2022-12-30 13:44:17'), toDateTimeOrDefault('', 'UTC', '2023-01-01'::DateTime('UTC'));
+```
+
+Result:
+
+```response
+┌─toDateTimeOrDefault('2022-12-30 13:44:17')─┬─toDateTimeOrDefault('', 'UTC', CAST('2023-01-01', 'DateTime(\'UTC\')'))─┐
+│ 2022-12-30 13:44:17 │ 2023-01-01 00:00:00 │
+└────────────────────────────────────────────┴─────────────────────────────────────────────────────────────────────────┘
+```
+
+
## toDate32
Converts the argument to the [Date32](/docs/en/sql-reference/data-types/date32.md) data type. If the value is outside the range, `toDate32` returns the border values supported by [Date32](/docs/en/sql-reference/data-types/date32.md). If the argument has [Date](/docs/en/sql-reference/data-types/date.md) type, its borders are taken into account.
@@ -519,6 +682,11 @@ SELECT toDateTime64('2019-01-01 00:00:00', 3, 'Asia/Istanbul') AS value, toTypeN
└─────────────────────────┴─────────────────────────────────────────────────────────────────────┘
```
+## toDateTime64OrZero
+
+Like [toDateTime64](#todatetime64) but returns the lower boundary of [DateTime64](/docs/en/sql-reference/data-types/datetime64.md) if an invalid argument is received.
+
+## toDateTime64OrNull
+
+Like [toDateTime64](#todatetime64) but returns `NULL` if an invalid argument is received.
+
+## toDateTime64OrDefault
+
+Like [toDateTime64](#todatetime64) but if unsuccessful, returns either the provided default value or the lower boundary of [DateTime64](/docs/en/sql-reference/data-types/datetime64.md).
## toDecimal(32\|64\|128\|256)
@@ -1247,7 +1415,7 @@ Returns DateTime values parsed from input string according to a MySQL style form
**Supported format specifiers**
All format specifiers listed in [formatDateTime](/docs/en/sql-reference/functions/date-time-functions.md#date_time_functions-formatDateTime) except:
-- %Q: Quarter (1-4)
+- %Q: Quarter (1-4)
**Example**
@@ -1341,10 +1509,12 @@ parseDateTimeBestEffort(time_string [, time_zone])
- A string containing 9..10 digit [unix timestamp](https://en.wikipedia.org/wiki/Unix_time).
- A string with a date and a time component: `YYYYMMDDhhmmss`, `DD/MM/YYYY hh:mm:ss`, `DD-MM-YY hh:mm`, `YYYY-MM-DD hh:mm:ss`, etc.
- A string with a date, but no time component: `YYYY`, `YYYYMM`, `YYYY*MM`, `DD/MM/YYYY`, `DD-MM-YY` etc.
-- A string with a day and time: `DD`, `DD hh`, `DD hh:mm`. In this case `YYYY-MM` are substituted as `2000-01`.
+- A string with a day and time: `DD`, `DD hh`, `DD hh:mm`. In this case `MM` is substituted by `01`.
- A string that includes the date and time along with time zone offset information: `YYYY-MM-DD hh:mm:ss ±h:mm`, etc. For example, `2020-12-12 17:36:00 -5:00`.
+- A [syslog timestamp](https://datatracker.ietf.org/doc/html/rfc3164#section-4.1.2): `Mmm dd hh:mm:ss`. For example, `Jun 9 14:20:32`.
For all of the formats with separator the function parses months names expressed by their full name or by the first three letters of a month name. Examples: `24/DEC/18`, `24-Dec-18`, `01-September-2018`.
+If the year is not specified, it is considered to be equal to the current year. If the resulting DateTime happens to be in the future (even by a second after the current moment), then the current year is substituted by the previous year.
**Returned value**
@@ -1415,23 +1585,46 @@ Result:
Query:
``` sql
-SELECT parseDateTimeBestEffort('10 20:19');
+SELECT toYear(now()) as year, parseDateTimeBestEffort('10 20:19');
```
Result:
```response
-┌─parseDateTimeBestEffort('10 20:19')─┐
-│ 2000-01-10 20:19:00 │
-└─────────────────────────────────────┘
+┌─year─┬─parseDateTimeBestEffort('10 20:19')─┐
+│ 2023 │ 2023-01-10 20:19:00 │
+└──────┴─────────────────────────────────────┘
+```
+
+Query:
+
+``` sql
+WITH
+ now() AS ts_now,
+ formatDateTime(ts_around, '%b %e %T') AS syslog_arg
+SELECT
+ ts_now,
+ syslog_arg,
+ parseDateTimeBestEffort(syslog_arg)
+FROM (SELECT arrayJoin([ts_now - 30, ts_now + 30]) AS ts_around);
+```
+
+Result:
+
+```response
+┌──────────────ts_now─┬─syslog_arg──────┬─parseDateTimeBestEffort(syslog_arg)─┐
+│ 2023-06-30 23:59:30 │ Jun 30 23:59:00 │ 2023-06-30 23:59:00 │
+│ 2023-06-30 23:59:30 │ Jul 1 00:00:00 │ 2022-07-01 00:00:00 │
+└─────────────────────┴─────────────────┴─────────────────────────────────────┘
```
**See Also**
-- [RFC 1123](https://tools.ietf.org/html/rfc1123)
+- [RFC 1123](https://datatracker.ietf.org/doc/html/rfc1123)
- [toDate](#todate)
- [toDateTime](#todatetime)
- [ISO 8601 announcement by @xkcd](https://xkcd.com/1179/)
+- [RFC 3164](https://datatracker.ietf.org/doc/html/rfc3164#section-4.1.2)
## parseDateTimeBestEffortUS
diff --git a/docs/en/sql-reference/statements/alter/column.md b/docs/en/sql-reference/statements/alter/column.md
index 378f41c1199..dae2c7dd1d3 100644
--- a/docs/en/sql-reference/statements/alter/column.md
+++ b/docs/en/sql-reference/statements/alter/column.md
@@ -232,6 +232,7 @@ ALTER TABLE table_with_ttl MODIFY COLUMN column_ttl REMOVE TTL;
Materializes or updates a column with an expression for a default value (`DEFAULT` or `MATERIALIZED`).
It is used if it is necessary to add or update a column with a complicated expression, because evaluating such an expression directly on `SELECT` turns out to be expensive.
+Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
Syntax:
diff --git a/docs/en/sql-reference/statements/alter/index.md b/docs/en/sql-reference/statements/alter/index.md
index 7a687a067aa..7dadc2be5b2 100644
--- a/docs/en/sql-reference/statements/alter/index.md
+++ b/docs/en/sql-reference/statements/alter/index.md
@@ -60,7 +60,7 @@ You can specify how long (in seconds) to wait for inactive replicas to execute a
For all `ALTER` queries, if `alter_sync = 2` and some replicas are not active for more than the time, specified in the `replication_wait_for_inactive_replica_timeout` setting, then an exception `UNFINISHED` is thrown.
:::
-For `ALTER TABLE ... UPDATE|DELETE` queries the synchronicity is defined by the [mutations_sync](/docs/en/operations/settings/settings.md/#mutations_sync) setting.
+For `ALTER TABLE ... UPDATE|DELETE|MATERIALIZE INDEX|MATERIALIZE PROJECTION|MATERIALIZE COLUMN` queries the synchronicity is defined by the [mutations_sync](/docs/en/operations/settings/settings.md/#mutations_sync) setting.
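+
+For example, a sketch of making such a query wait for all replicas (the table and column names are illustrative):
+
+```sql
+SET mutations_sync = 2;
+ALTER TABLE tab UPDATE value = value + 1 WHERE id = 42;
+```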
## Related content
diff --git a/docs/en/sql-reference/statements/alter/projection.md b/docs/en/sql-reference/statements/alter/projection.md
index 030e9352a00..fb438927089 100644
--- a/docs/en/sql-reference/statements/alter/projection.md
+++ b/docs/en/sql-reference/statements/alter/projection.md
@@ -142,19 +142,19 @@ The following operations with [projections](/docs/en/engines/table-engines/merge
## ADD PROJECTION
-`ALTER TABLE [db].name ADD PROJECTION name ( SELECT [GROUP BY] [ORDER BY] )` - Adds projection description to tables metadata.
+`ALTER TABLE [db.]name [ON CLUSTER cluster] ADD PROJECTION [IF NOT EXISTS] name ( SELECT [GROUP BY] [ORDER BY] )` - Adds projection description to the table's metadata.
## DROP PROJECTION
-`ALTER TABLE [db].name DROP PROJECTION name` - Removes projection description from tables metadata and deletes projection files from disk. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
+`ALTER TABLE [db.]name [ON CLUSTER cluster] DROP PROJECTION [IF EXISTS] name` - Removes projection description from the table's metadata and deletes projection files from disk. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
## MATERIALIZE PROJECTION
-`ALTER TABLE [db.]table MATERIALIZE PROJECTION name IN PARTITION partition_name` - The query rebuilds the projection `name` in the partition `partition_name`. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
+`ALTER TABLE [db.]table [ON CLUSTER cluster] MATERIALIZE PROJECTION [IF EXISTS] name [IN PARTITION partition_name]` - The query rebuilds the projection `name` in the partition `partition_name`. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
## CLEAR PROJECTION
-`ALTER TABLE [db.]table CLEAR PROJECTION name IN PARTITION partition_name` - Deletes projection files from disk without removing description. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
+`ALTER TABLE [db.]table [ON CLUSTER cluster] CLEAR PROJECTION [IF EXISTS] name [IN PARTITION partition_name]` - Deletes projection files from disk without removing description. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
The commands `ADD`, `DROP` and `CLEAR` are lightweight in the sense that they only change metadata or remove files.
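
For example, a sketch combining the commands above (the table and projection names are illustrative):

```sql
ALTER TABLE tab ADD PROJECTION IF NOT EXISTS proj (SELECT user_id, count() GROUP BY user_id);
ALTER TABLE tab MATERIALIZE PROJECTION proj;
```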
diff --git a/docs/en/sql-reference/statements/alter/skipping-index.md b/docs/en/sql-reference/statements/alter/skipping-index.md
index 67af76986da..42fd12d9487 100644
--- a/docs/en/sql-reference/statements/alter/skipping-index.md
+++ b/docs/en/sql-reference/statements/alter/skipping-index.md
@@ -10,15 +10,25 @@ sidebar_label: INDEX
The following operations are available:
-- `ALTER TABLE [db].table_name [ON CLUSTER cluster] ADD INDEX name expression TYPE type GRANULARITY value [FIRST|AFTER name]` - Adds index description to tables metadata.
+## ADD INDEX
-- `ALTER TABLE [db].table_name [ON CLUSTER cluster] DROP INDEX name` - Removes index description from tables metadata and deletes index files from disk. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
+`ALTER TABLE [db.]table_name [ON CLUSTER cluster] ADD INDEX [IF NOT EXISTS] name expression TYPE type [GRANULARITY value] [FIRST|AFTER name]` - Adds index description to the table's metadata.
-- `ALTER TABLE [db.]table_name [ON CLUSTER cluster] MATERIALIZE INDEX name [IN PARTITION partition_name]` - Rebuilds the secondary index `name` for the specified `partition_name`. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations). If `IN PARTITION` part is omitted then it rebuilds the index for the whole table data.
+## DROP INDEX
-The first two commands are lightweight in a sense that they only change metadata or remove files.
+`ALTER TABLE [db.]table_name [ON CLUSTER cluster] DROP INDEX [IF EXISTS] name` - Removes index description from the table's metadata and deletes index files from disk. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
-Also, they are replicated, syncing indices metadata via ZooKeeper.
+## MATERIALIZE INDEX
+
+`ALTER TABLE [db.]table_name [ON CLUSTER cluster] MATERIALIZE INDEX [IF EXISTS] name [IN PARTITION partition_name]` - Rebuilds the secondary index `name` for the specified `partition_name`. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations). If `IN PARTITION` part is omitted then it rebuilds the index for the whole table data.
+
+## CLEAR INDEX
+
+`ALTER TABLE [db.]table_name [ON CLUSTER cluster] CLEAR INDEX [IF EXISTS] name [IN PARTITION partition_name]` - Deletes the secondary index files from disk without removing description. Implemented as a [mutation](/docs/en/sql-reference/statements/alter/index.md#mutations).
+
+
+The commands `ADD`, `DROP`, and `CLEAR` are lightweight in the sense that they only change metadata or remove files.
+Also, they are replicated, syncing indices metadata via ClickHouse Keeper or ZooKeeper.
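+
+For example, a sketch combining the commands above (the table, column, and index names are illustrative):
+
+```sql
+ALTER TABLE tab ADD INDEX IF NOT EXISTS idx_val val TYPE minmax GRANULARITY 4;
+ALTER TABLE tab MATERIALIZE INDEX idx_val;
+```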
:::note
Index manipulation is supported only for tables with [`*MergeTree`](/docs/en/engines/table-engines/mergetree-family/mergetree.md) engine (including [replicated](/docs/en/engines/table-engines/mergetree-family/replication.md) variants).
diff --git a/docs/en/sql-reference/statements/create/dictionary.md b/docs/en/sql-reference/statements/create/dictionary.md
index 29c72d62f24..c0a153c5660 100644
--- a/docs/en/sql-reference/statements/create/dictionary.md
+++ b/docs/en/sql-reference/statements/create/dictionary.md
@@ -82,6 +82,35 @@ LIFETIME(MIN 0 MAX 1000)
LAYOUT(FLAT())
```
+:::note
+When using the SQL console in [ClickHouse Cloud](https://clickhouse.com), you must specify a user (`default` or any other user with the role `default_role`) and password when creating a dictionary.
+:::
+
+```sql
+CREATE USER IF NOT EXISTS clickhouse_admin
+IDENTIFIED WITH sha256_password BY 'passworD43$x';
+
+GRANT default_role TO clickhouse_admin;
+
+CREATE DATABASE foo_db;
+
+CREATE TABLE foo_db.source_table (
+ id UInt64,
+ value String
+) ENGINE = MergeTree
+PRIMARY KEY id;
+
+CREATE DICTIONARY foo_db.id_value_dictionary
+(
+ id UInt64,
+ value String
+)
+PRIMARY KEY id
+SOURCE(CLICKHOUSE(TABLE 'source_table' USER 'clickhouse_admin' PASSWORD 'passworD43$x' DB 'foo_db'))
+LAYOUT(FLAT())
+LIFETIME(MIN 0 MAX 1000);
+```
+
### Create a dictionary from a table in a remote ClickHouse service
Input table (in the remote ClickHouse service) `source_table`:
diff --git a/docs/en/sql-reference/statements/create/table.md b/docs/en/sql-reference/statements/create/table.md
index de44a001472..1a72f89fb1f 100644
--- a/docs/en/sql-reference/statements/create/table.md
+++ b/docs/en/sql-reference/statements/create/table.md
@@ -380,11 +380,15 @@ High compression levels are useful for asymmetric scenarios, like compress once,
`DEFLATE_QPL` — [Deflate compression algorithm](https://github.com/intel/qpl) implemented by Intel® Query Processing Library. Some limitations apply:
-- DEFLATE_QPL is experimental and can only be used after setting configuration parameter `allow_experimental_codecs=1`.
+- DEFLATE_QPL is disabled by default and can only be used after setting configuration parameter `enable_deflate_qpl_codec = 1`.
- DEFLATE_QPL requires a ClickHouse build compiled with SSE 4.2 instructions (by default, this is the case). Refer to [Build Clickhouse with DEFLATE_QPL](/docs/en/development/building_and_benchmarking_deflate_qpl.md/#Build-Clickhouse-with-DEFLATE_QPL) for more details.
- DEFLATE_QPL works best if the system has an Intel® IAA (In-Memory Analytics Accelerator) offloading device. Refer to [Accelerator Configuration](https://intel.github.io/qpl/documentation/get_started_docs/installation.html#accelerator-configuration) and [Benchmark with DEFLATE_QPL](/docs/en/development/building_and_benchmarking_deflate_qpl.md/#Run-Benchmark-with-DEFLATE_QPL) for more details.
- DEFLATE_QPL-compressed data can only be transferred between ClickHouse nodes compiled with SSE 4.2 enabled.
+:::note
+DEFLATE_QPL is not available in ClickHouse Cloud.
+:::
+
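+For example, a sketch of enabling and using the codec (the table name is illustrative):
+
+```sql
+SET enable_deflate_qpl_codec = 1;
+CREATE TABLE qpl_demo (s String CODEC(DEFLATE_QPL)) ENGINE = MergeTree ORDER BY tuple();
+```
+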
### Specialized Codecs
These codecs are designed to make compression more effective by using specific features of data. Some of these codecs do not compress data themself. Instead, they prepare the data for a common purpose codec, which compresses it better than without this preparation.
diff --git a/docs/en/sql-reference/statements/delete.md b/docs/en/sql-reference/statements/delete.md
index fa9f08e225f..87a6d4d92d8 100644
--- a/docs/en/sql-reference/statements/delete.md
+++ b/docs/en/sql-reference/statements/delete.md
@@ -55,6 +55,9 @@ With the described implementation now we can see what can negatively affect 'DEL
- Table having a very large number of data parts
- Having a lot of data in Compact parts—in a Compact part, all columns are stored in one file.
+:::note
+Currently, lightweight `DELETE` does not work for tables with projections, because rows in a projection may be affected and would require the projection to be rebuilt. Rebuilding a projection would make the deletion no longer lightweight, so this is not supported.
+:::
## Related content
diff --git a/docs/en/sql-reference/statements/select/join.md b/docs/en/sql-reference/statements/select/join.md
index 08ffae838f8..7971b3ba275 100644
--- a/docs/en/sql-reference/statements/select/join.md
+++ b/docs/en/sql-reference/statements/select/join.md
@@ -21,6 +21,9 @@ Expressions from `ON` clause and columns from `USING` clause are called “join
## Related Content
- Blog: [ClickHouse: A Blazingly Fast DBMS with Full SQL Join Support - Part 1](https://clickhouse.com/blog/clickhouse-fully-supports-joins)
+- Blog: [ClickHouse: A Blazingly Fast DBMS with Full SQL Join Support - Under the Hood - Part 2](https://clickhouse.com/blog/clickhouse-fully-supports-joins-hash-joins-part2)
+- Blog: [ClickHouse: A Blazingly Fast DBMS with Full SQL Join Support - Under the Hood - Part 3](https://clickhouse.com/blog/clickhouse-fully-supports-joins-full-sort-partial-merge-part3)
+- Blog: [ClickHouse: A Blazingly Fast DBMS with Full SQL Join Support - Under the Hood - Part 4](https://clickhouse.com/blog/clickhouse-fully-supports-joins-direct-join-part4)
## Supported Types of JOIN
diff --git a/docs/en/sql-reference/statements/set.md b/docs/en/sql-reference/statements/set.md
index 14f523adc3b..3e5e86eccf7 100644
--- a/docs/en/sql-reference/statements/set.md
+++ b/docs/en/sql-reference/statements/set.md
@@ -10,7 +10,7 @@ sidebar_label: SET
SET param = value
```
-Assigns `value` to the `param` [setting](../../operations/settings/index.md) for the current session. You cannot change [server settings](../../operations/server-configuration-parameters/index.md) this way.
+Assigns `value` to the `param` [setting](../../operations/settings/index.md) for the current session. You cannot change [server settings](../../operations/server-configuration-parameters/settings.md) this way.
You can also set all the values from the specified settings profile in a single query.
diff --git a/docs/en/sql-reference/statements/show.md b/docs/en/sql-reference/statements/show.md
index 21c0010498a..336b93db9d5 100644
--- a/docs/en/sql-reference/statements/show.md
+++ b/docs/en/sql-reference/statements/show.md
@@ -273,7 +273,7 @@ SHOW DICTIONARIES FROM db LIKE '%reg%' LIMIT 2
Displays a list of primary and data skipping indexes of a table.
```sql
-SHOW [EXTENDED] {INDEX | INDEXES | KEYS } {FROM | IN}