From eb7aad00160b1418ed96ecc83770b62ce3bfaaf0 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 14 Nov 2023 11:35:54 +0100 Subject: [PATCH 001/245] Do not consider parts broken if only projections are broken --- src/Interpreters/MutationsInterpreter.cpp | 14 + src/Interpreters/MutationsInterpreter.h | 1 + src/Storages/MergeTree/IMergeTreeDataPart.cpp | 61 +++- src/Storages/MergeTree/IMergeTreeDataPart.h | 19 +- src/Storages/MergeTree/MergeTreeData.cpp | 26 +- src/Storages/MergeTree/MergeTreeData.h | 11 +- .../MergeTree/MergeTreeDataPartChecksum.h | 2 + src/Storages/MergeTree/MutateTask.cpp | 8 +- .../ReplicatedMergeTreePartCheckThread.cpp | 31 +- .../ReplicatedMergeTreePartCheckThread.h | 4 +- src/Storages/MergeTree/checkDataPart.cpp | 80 ++++- src/Storages/MergeTree/checkDataPart.h | 4 +- src/Storages/StorageMergeTree.cpp | 5 +- src/Storages/StorageReplicatedMergeTree.cpp | 3 +- src/Storages/System/StorageSystemDisks.cpp | 2 +- .../System/StorageSystemPartsBase.cpp | 8 +- src/Storages/System/StorageSystemPartsBase.h | 2 +- .../System/StorageSystemProjectionParts.cpp | 48 ++- .../StorageSystemProjectionPartsColumns.cpp | 21 +- .../02916_broken_projection.reference | 224 ++++++++++++++ .../0_stateless/02916_broken_projection.sh | 283 ++++++++++++++++++ 21 files changed, 795 insertions(+), 62 deletions(-) create mode 100644 tests/queries/0_stateless/02916_broken_projection.reference create mode 100755 tests/queries/0_stateless/02916_broken_projection.sh diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp index 0ace0a8b79c..a9a5d4f33d0 100644 --- a/src/Interpreters/MutationsInterpreter.cpp +++ b/src/Interpreters/MutationsInterpreter.cpp @@ -305,6 +305,11 @@ bool MutationsInterpreter::Source::hasProjection(const String & name) const return part && part->hasProjection(name); } +bool MutationsInterpreter::Source::hasBrokenProjection(const String & name) const +{ + return part && part->hasBrokenProjection(name); +} + bool MutationsInterpreter::Source::isCompactPart() const { return part && part->getType() == MergeTreeDataPartType::Compact; @@ -922,6 +927,15 @@ void MutationsInterpreter::prepare(bool dry_run) materialized_indices.insert(index.name); } + /// Always rebuild broken projections. 
+    for (const auto & projection : metadata_snapshot->getProjections())
+    {
+        if (!source.hasBrokenProjection(projection.name))
+            continue;
+
+        materialized_projections.insert(projection.name);
+    }
+
     for (const auto & projection : metadata_snapshot->getProjections())
     {
         if (!source.hasProjection(projection.name))
diff --git a/src/Interpreters/MutationsInterpreter.h b/src/Interpreters/MutationsInterpreter.h
index c53b86ddb5e..33b8021a653 100644
--- a/src/Interpreters/MutationsInterpreter.h
+++ b/src/Interpreters/MutationsInterpreter.h
@@ -122,6 +122,7 @@ public:
         bool materializeTTLRecalculateOnly() const;
         bool hasSecondaryIndex(const String & name) const;
         bool hasProjection(const String & name) const;
+        bool hasBrokenProjection(const String & name) const;
         bool isCompactPart() const;
 
         void read(
diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
index 9bc72577b25..bc81758675e 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@@ -732,7 +732,23 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch
         else
         {
             auto part = getProjectionPartBuilder(projection.name).withPartFormatFromDisk().build();
-            part->loadColumnsChecksumsIndexes(require_columns_checksums, check_consistency);
+
+            try
+            {
+                part->loadColumnsChecksumsIndexes(require_columns_checksums, check_consistency);
+            }
+            catch (...)
+            {
+                if (isRetryableException(std::current_exception()))
+                    throw;
+
+                LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"),
+                    "Cannot load projection {}, will consider it broken", projection.name);
+
+                addBrokenProjectionPart(projection.name, std::move(part), getCurrentExceptionMessage(false), getCurrentExceptionCode());
+                continue;
+            }
+
             addProjectionPart(projection.name, std::move(part));
         }
     }
@@ -1129,7 +1145,8 @@ void IMergeTreeDataPart::loadChecksums(bool require)
             /// Check the data while we are at it.
             LOG_WARNING(storage.log, "Checksums for part {} not found. Will calculate them from data on disk.", name);
 
-            checksums = checkDataPart(shared_from_this(), false);
+            bool noop;
+            checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */false);
             writeChecksums(checksums, {});
 
             bytes_on_disk = checksums.getTotalSizeOnDisk();
@@ -2130,6 +2147,46 @@ std::optional<String> IMergeTreeDataPart::getStreamNameForColumn(
     return getStreamNameOrHash(stream_name, extension, storage_);
 }
 
+void IMergeTreeDataPart::addBrokenProjectionPart(
+    const String & projection_name,
+    std::shared_ptr<IMergeTreeDataPart> projection_part,
+    const String & message,
+    int code)
+{
+    projection_part->setBrokenReason(message, code);
+    bool inserted = broken_projection_parts.emplace(projection_name, projection_part).second;
+    if (!inserted)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Projection part {} in part {} is already added to a broken projection parts list", projection_name, name);
+}
+
+void IMergeTreeDataPart::markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const
+{
+    std::lock_guard lock(broken_projections_mutex);
+
+    auto it = projection_parts.find(projection_name);
+    if (it == projection_parts.end())
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no projection part '{}'", projection_name);
+
+    it->second->setBrokenReason(message, code);
+
+    broken_projection_parts.emplace(projection_name, it->second);
+    projection_parts.erase(it);
+}
+
+void IMergeTreeDataPart::setBrokenReason(const String & message, int code)
+{
+    std::lock_guard lock(broken_projections_mutex);
+    is_broken = true;
+    exception = message;
+    exception_code = code;
+}
+
+bool IMergeTreeDataPart::hasBrokenProjection(const String & projection_name) const
+{
+    std::lock_guard lock(broken_projections_mutex);
+    return broken_projection_parts.contains(projection_name);
+}
+
 bool isCompactPart(const MergeTreeDataPartPtr & data_part)
 {
     return (data_part && data_part->getType() == MergeTreeDataPartType::Compact);
diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h
index a9659d2f5f4..52a1541e15f 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.h
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.h
@@ -255,6 +255,12 @@ public:
     /// Frozen by ALTER TABLE ... FREEZE ... It is used for information purposes in system.parts table.
     mutable std::atomic<bool> is_frozen {false};
 
+    /// If it is a projection part, it can be broken sometimes.
+    mutable std::atomic<bool> is_broken {false};
+    mutable std::string exception;
+    mutable int exception_code = 0;
+    mutable std::mutex broken_projections_mutex;
+
     /// Indicates that the part was marked Outdated by PartCheckThread because the part was not committed to ZooKeeper
     mutable bool is_unexpected_local_part = false;
 
@@ -405,12 +411,20 @@ public:
 
     const std::map<String, std::shared_ptr<IMergeTreeDataPart>> & getProjectionParts() const { return projection_parts; }
 
+    const std::map<String, std::shared_ptr<IMergeTreeDataPart>> & getBrokenProjectionParts() const { return broken_projection_parts; }
+
     MergeTreeDataPartBuilder getProjectionPartBuilder(const String & projection_name, bool is_temp_projection = false);
 
     void addProjectionPart(const String & projection_name, std::shared_ptr<IMergeTreeDataPart> && projection_part);
 
+    void addBrokenProjectionPart(const String & projection_name, std::shared_ptr<IMergeTreeDataPart> projection_part, const String & message, int code);
+
+    void markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const;
+
     bool hasProjection(const String & projection_name) const { return projection_parts.contains(projection_name); }
 
+    bool hasBrokenProjection(const String & projection_name) const;
+
     void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false);
 
     /// Return set of metadata file names without checksums. For example,
@@ -564,7 +578,8 @@ protected:
     const IMergeTreeDataPart * parent_part;
     String parent_part_name;
 
-    std::map<String, std::shared_ptr<IMergeTreeDataPart>> projection_parts;
+    mutable std::map<String, std::shared_ptr<IMergeTreeDataPart>> projection_parts;
+    mutable std::map<String, std::shared_ptr<IMergeTreeDataPart>> broken_projection_parts;
 
     mutable PartMetadataManagerPtr metadata_manager;
 
@@ -678,6 +693,8 @@ private:
    void incrementStateMetric(MergeTreeDataPartState state) const;
    void decrementStateMetric(MergeTreeDataPartState state) const;
 
+    void setBrokenReason(const String & message, int code);
+
     /// This ugly flag is needed for debug assertions only
     mutable bool part_is_probably_removed_from_disk = false;
 };
diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index 1c0f9208fef..152c386e188 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -5737,7 +5737,7 @@ MergeTreeData::getDataPartsVectorForInternalUsage(const DataPartStates & afforda
 }
 
 MergeTreeData::ProjectionPartsVector
-MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, DataPartStateVector * out_states) const
+MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, bool fill_states) const
 {
     auto lock = lockParts();
     ProjectionPartsVector res;
@@ -5749,14 +5749,20 @@ MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & a
             res.data_parts.push_back(part);
             for (const auto & [_, projection_part] : part->getProjectionParts())
                 res.projection_parts.push_back(projection_part);
+            for (const auto & [_, projection_part] : part->getBrokenProjectionParts())
+                res.broken_projection_parts.push_back(projection_part);
         }
     }
 
-    if (out_states != nullptr)
+    if (fill_states)
     {
-        out_states->resize(res.projection_parts.size());
+        res.projection_parts_states.resize(res.projection_parts.size());
         for (size_t i = 0; i < res.projection_parts.size(); ++i)
-            (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState();
+            (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState();
+
+        res.broken_projection_parts_states.resize(res.broken_projection_parts.size());
+        for (size_t i = 0; i < res.broken_projection_parts.size(); ++i)
+            (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState();
     }
 
     return res;
@@ -5809,7 +5815,7 @@ bool MergeTreeData::supportsLightweightDelete() const
     return true;
 }
 
-MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states) const
+MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(bool fill_states) const
 {
     ProjectionPartsVector res;
     auto lock = lockParts();
@@ -5820,11 +5826,15 @@ MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(
             res.projection_parts.push_back(projection_part);
     }
 
-    if (out_states != nullptr)
+    if (fill_states)
     {
-        out_states->resize(res.projection_parts.size());
+        res.projection_parts_states.resize(res.projection_parts.size());
         for (size_t i = 0; i < res.projection_parts.size(); ++i)
-            (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState();
+            (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState();
+
+        res.broken_projection_parts_states.resize(res.broken_projection_parts.size());
+        for (size_t i = 0; i < res.broken_projection_parts.size(); ++i)
+            (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState();
     }
     return res;
 }
diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h
index 54104849fe4..4ef3b75988b 100644
--- a/src/Storages/MergeTree/MergeTreeData.h
+++ b/src/Storages/MergeTree/MergeTreeData.h
@@ -468,8 +468,13 @@ public:
 
     struct ProjectionPartsVector
     {
-        DataPartsVector projection_parts;
         DataPartsVector data_parts;
+
+        DataPartsVector projection_parts;
+        DataPartStateVector projection_parts_states;
+
+        DataPartsVector broken_projection_parts;
+        DataPartStateVector broken_projection_parts_states;
     };
 
     /// Returns a copy of the list so that the caller shouldn't worry about locks.
@@ -484,7 +489,7 @@ public:
         const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const;
     /// Same as above but only returns projection parts
     ProjectionPartsVector getProjectionPartsVectorForInternalUsage(
-        const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const;
+        const DataPartStates & affordable_states, bool fill_states = false) const;
 
 
     /// Returns absolutely all parts (and snapshot of their states)
@@ -496,7 +501,7 @@ public:
     size_t getTotalMarksCount() const;
 
     /// Same as above but only returns projection parts
-    ProjectionPartsVector getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states = nullptr) const;
+    ProjectionPartsVector getAllProjectionPartsVector(bool fill_states = false) const;
 
     /// Returns parts in Active state
     DataParts getDataPartsForInternalUsage() const;
diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
index 8e5e8c8c448..3595ce38db5 100644
--- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
+++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
@@ -54,6 +54,8 @@ struct MergeTreeDataPartChecksums
 
     bool has(const String & file_name) const { return files.find(file_name) != files.end(); }
 
+    bool remove(const String & file_name) { return files.erase(file_name); }
+
     bool empty() const { return files.empty(); }
 
     /// Checks that the set of columns and their checksums are the same. If not, throws an exception.
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 911b25de2ad..8ef1621b647 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -513,7 +513,9 @@ static std::set<ProjectionDescriptionRawPtr> getProjectionsToRecalculate(
     {
         bool need_recalculate =
             materialized_projections.contains(projection.name)
-            || (!is_full_part_storage && source_part->hasProjection(projection.name));
+            || (!is_full_part_storage
+                && (source_part->hasProjection(projection.name)
+                    || source_part->hasBrokenProjection(projection.name)));
 
         if (need_recalculate)
             projections_to_recalc.insert(&projection);
@@ -1367,7 +1369,9 @@ private:
 
             bool need_recalculate =
                 ctx->materialized_projections.contains(projection.name)
-                || (!is_full_part_storage && ctx->source_part->hasProjection(projection.name));
+                || (!is_full_part_storage
+                    && (ctx->source_part->hasProjection(projection.name)
+                        || ctx->source_part->hasBrokenProjection(projection.name)));
 
             if (need_recalculate)
             {
diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp
index b1875464725..4468cf8e3bf 100644
--- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp
+++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp
@@ -274,7 +274,7 @@ std::pair<bool, MergeTreeDataPartPtr> ReplicatedMergeTreePartCheckThread::findLo
     return std::make_pair(exists_in_zookeeper, part);
 }
 
-ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const String & part_name)
+ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const String & part_name, bool throw_on_broken_projection)
 {
     ReplicatedCheckResult result;
     auto [exists_in_zookeeper, part] = findLocalPart(part_name);
@@ -341,6 +341,7 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St
     /// before the ReplicatedMergeTreePartHeader was introduced.
     String part_path = storage.replica_path + "/parts/" + part_name;
     String part_znode = zookeeper->get(part_path);
+    bool is_broken_projection = false;
 
     try
     {
@@ -362,8 +363,10 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St
 
         checkDataPart(
             part,
-            true,
-            [this] { return need_stop.load(); });
+            /* require_checksums */true,
+            is_broken_projection,
+            [this] { return need_stop.load(); },
+            throw_on_broken_projection);
 
         if (need_stop)
         {
@@ -384,12 +387,22 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St
 
         tryLogCurrentException(log, __PRETTY_FUNCTION__);
 
-        auto message = PreformattedMessage::create("Part {} looks broken. Removing it and will try to fetch.", part_name);
-        LOG_ERROR(log, message);
+        PreformattedMessage message;
+        if (is_broken_projection)
+        {
+            message = PreformattedMessage::create("Part {} has a broken projection. It will be ignored.", part_name);
+            LOG_DEBUG(log, message);
+            result.action = ReplicatedCheckResult::DoNothing;
+        }
+        else
+        {
+            message = PreformattedMessage::create("Part {} looks broken. Removing it and will try to fetch.", part_name);
+            LOG_ERROR(log, message);
+            result.action = ReplicatedCheckResult::TryFetchMissing;
+        }
 
         /// Part is broken, let's try to find it and fetch.
         result.status = {part_name, false, message};
-        result.action = ReplicatedCheckResult::TryFetchMissing;
         return result;
     }
 
@@ -419,12 +432,12 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St
 }
 
 
-CheckResult ReplicatedMergeTreePartCheckThread::checkPartAndFix(const String & part_name, std::optional<time_t> * recheck_after)
+CheckResult ReplicatedMergeTreePartCheckThread::checkPartAndFix(const String & part_name, std::optional<time_t> * recheck_after, bool throw_on_broken_projection)
 {
     LOG_INFO(log, "Checking part {}", part_name);
     ProfileEvents::increment(ProfileEvents::ReplicatedPartChecks);
 
-    ReplicatedCheckResult result = checkPartImpl(part_name);
+    ReplicatedCheckResult result = checkPartImpl(part_name, throw_on_broken_projection);
     switch (result.action)
     {
         case ReplicatedCheckResult::None: UNREACHABLE();
@@ -577,7 +590,7 @@ void ReplicatedMergeTreePartCheckThread::run()
         }
 
         std::optional<time_t> recheck_after;
-        checkPartAndFix(selected->name, &recheck_after);
+        checkPartAndFix(selected->name, &recheck_after, /* throw_on_broken_projection */false);
 
         if (need_stop)
             return;
diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h
index 68dc6ca3d1d..26c4bfe9384 100644
--- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h
+++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h
@@ -65,9 +65,9 @@ public:
     size_t size() const;
 
     /// Check part by name
-    CheckResult checkPartAndFix(const String & part_name, std::optional<time_t> * recheck_after = nullptr);
+    CheckResult checkPartAndFix(const String & part_name, std::optional<time_t> * recheck_after = nullptr, bool throw_on_broken_projection = true);
 
-    ReplicatedCheckResult checkPartImpl(const String & part_name);
+    ReplicatedCheckResult checkPartImpl(const String & part_name, bool throw_on_broken_projection);
 
     std::unique_lock<std::mutex> pausePartsCheck();
 
diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp
index a75df00e8a7..74af7cbb77c 100644
--- a/src/Storages/MergeTree/checkDataPart.cpp
+++ b/src/Storages/MergeTree/checkDataPart.cpp
@@ -111,7 +111,9 @@ static IMergeTreeDataPart::Checksums checkDataPart(
     const NameSet & files_without_checksums,
     const ReadSettings & read_settings,
     bool require_checksums,
-    std::function<bool()> is_cancelled)
+    std::function<bool()> is_cancelled,
+    bool & is_broken_projection,
+    bool throw_on_broken_projection)
 {
     /** Responsibility:
       * - read list of columns from columns.txt;
      * - read checksums if exist;
      * - validate list of columns and checksums
      */
 
     CurrentMetrics::Increment metric_increment{CurrentMetrics::ReplicatedChecks};
+    Poco::Logger * log = &Poco::Logger::get("checkDataPart");
 
     NamesAndTypesList columns_txt;
 
@@ -269,23 +272,68 @@ static IMergeTreeDataPart::Checksums checkDataPart(
         }
     }
 
-    for (const auto & [name, projection] : data_part->getProjectionParts())
+    auto check_projection = [&](const String & name, std::shared_ptr<IMergeTreeDataPart> projection)
     {
-        if (is_cancelled())
-            return {};
-
         auto projection_file = name + ".proj";
-        auto projection_checksums = checkDataPart(
-            projection, *data_part_storage.getProjection(projection_file),
-            projection->getColumns(), projection->getType(),
-            projection->getFileNamesWithoutChecksums(),
-            read_settings, require_checksums, is_cancelled);
+        if (!throw_on_broken_projection && projection->is_broken)
+        {
+            projections_on_disk.erase(projection_file);
+            checksums_txt.remove(projection_file);
+            return;
+        }
+
+        IMergeTreeDataPart::Checksums projection_checksums;
+        try
+        {
+            bool noop;
+            projection_checksums = checkDataPart(
+                projection, *data_part_storage.getProjection(projection_file),
+                projection->getColumns(), projection->getType(),
+                projection->getFileNamesWithoutChecksums(),
+                read_settings, require_checksums, is_cancelled, noop, /* throw_on_broken_projection */false);
+        }
+        catch (...)
+        {
+            if (isRetryableException(std::current_exception()))
+                throw;
+
+            LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file);
+
+            if (!data_part->hasBrokenProjection(name))
+                data_part->markProjectionPartAsBroken(name, getCurrentExceptionMessage(false), getCurrentExceptionCode());
+
+            is_broken_projection = true;
+            if (throw_on_broken_projection)
+                throw;
+
+            projections_on_disk.erase(projection_file);
+            checksums_txt.remove(projection_file);
+            return;
+        }
 
         checksums_data.files[projection_file] = IMergeTreeDataPart::Checksums::Checksum(
             projection_checksums.getTotalSizeOnDisk(),
             projection_checksums.getTotalChecksumUInt128());
 
         projections_on_disk.erase(projection_file);
+    };
+
+    auto broken_projection_parts = data_part->getBrokenProjectionParts(); /// Iterate over copy
+    for (const auto & [name, projection] : broken_projection_parts)
+    {
+        if (is_cancelled())
+            return {};
+        else
+            check_projection(name, projection);
+    }
+
+    auto projection_parts = data_part->getProjectionParts(); /// Iterate over copy
+    for (const auto & [name, projection] : projection_parts)
+    {
+        if (is_cancelled())
+            return {};
+        else
+            check_projection(name, projection);
     }
 
     if (require_checksums && !projections_on_disk.empty())
@@ -315,7 +363,9 @@ IMergeTreeDataPart::Checksums checkDataPartInMemory(const DataPartInMemoryPtr &
 IMergeTreeDataPart::Checksums checkDataPart(
     MergeTreeData::DataPartPtr data_part,
     bool require_checksums,
-    std::function<bool()> is_cancelled)
+    bool & is_broken_projection,
+    std::function<bool()> is_cancelled,
+    bool throw_on_broken_projection)
 {
     if (auto part_in_memory = asInMemoryPart(data_part))
         return checkDataPartInMemory(part_in_memory);
@@ -357,7 +407,9 @@ IMergeTreeDataPart::Checksums checkDataPart(
             data_part->getFileNamesWithoutChecksums(),
             read_settings,
             require_checksums,
-            is_cancelled);
+            is_cancelled,
+            is_broken_projection,
+            throw_on_broken_projection);
     };
 
     try
@@ -371,7 +423,9 @@ IMergeTreeDataPart::Checksums checkDataPart(
             data_part->getFileNamesWithoutChecksums(),
             read_settings,
             require_checksums,
-            is_cancelled);
+            is_cancelled,
+            is_broken_projection,
+            throw_on_broken_projection);
     }
     catch (...)
     {
diff --git a/src/Storages/MergeTree/checkDataPart.h b/src/Storages/MergeTree/checkDataPart.h
index d0e48b6f80a..a01978f4efe 100644
--- a/src/Storages/MergeTree/checkDataPart.h
+++ b/src/Storages/MergeTree/checkDataPart.h
@@ -10,7 +10,9 @@ namespace DB
 IMergeTreeDataPart::Checksums checkDataPart(
     MergeTreeData::DataPartPtr data_part,
     bool require_checksums,
-    std::function<bool()> is_cancelled = []{ return false; });
+    bool & is_broken_projection,
+    std::function<bool()> is_cancelled = []{ return false; },
+    bool throw_on_broken_projection = false);
 
 bool isNotEnoughMemoryErrorCode(int code);
 bool isRetryableException(const std::exception_ptr exception_ptr);
diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp
index e9a0dd5fbf3..74277616e95 100644
--- a/src/Storages/StorageMergeTree.cpp
+++ b/src/Storages/StorageMergeTree.cpp
@@ -2242,11 +2242,12 @@ std::optional<CheckResult> StorageMergeTree::checkDataNext(DataValidationTasksPt
     {
         /// If the checksums file is not present, calculate the checksums and write them to disk.
         static constexpr auto checksums_path = "checksums.txt";
+        bool noop;
         if (part->isStoredOnDisk() && !part->getDataPartStorage().exists(checksums_path))
         {
             try
             {
-                auto calculated_checksums = checkDataPart(part, false);
+                auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true);
                 calculated_checksums.checkEqual(part->checksums, true);
 
                 auto & part_mutable = const_cast<IMergeTreeDataPart &>(*part);
@@ -2267,7 +2268,7 @@ std::optional<CheckResult> StorageMergeTree::checkDataNext(DataValidationTasksPt
         {
             try
             {
-                checkDataPart(part, true);
+                checkDataPart(part, true, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true);
                 return CheckResult(part->name, true, "");
             }
             catch (...)
diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp
index 74821a9186c..1859fa03094 100644
--- a/src/Storages/StorageReplicatedMergeTree.cpp
+++ b/src/Storages/StorageReplicatedMergeTree.cpp
@@ -8690,12 +8690,11 @@ IStorage::DataValidationTasksPtr StorageReplicatedMergeTree::getCheckTaskList(
 
 std::optional<CheckResult> StorageReplicatedMergeTree::checkDataNext(DataValidationTasksPtr & check_task_list)
 {
-
     if (auto part = assert_cast<DataValidationTasks *>(check_task_list.get())->next())
     {
         try
         {
-            return CheckResult(part_check_thread.checkPartAndFix(part->name));
+            return part_check_thread.checkPartAndFix(part->name, /* recheck_after */nullptr, /* throw_on_broken_projection */true);
         }
         catch (const Exception & ex)
         {
diff --git a/src/Storages/System/StorageSystemDisks.cpp b/src/Storages/System/StorageSystemDisks.cpp
index 23a00cc7ae5..250fcdba641 100644
--- a/src/Storages/System/StorageSystemDisks.cpp
+++ b/src/Storages/System/StorageSystemDisks.cpp
@@ -63,7 +63,7 @@ Pipe StorageSystemDisks::read(
     for (const auto & [disk_name, disk_ptr] : context->getDisksMap())
     {
         col_name->insert(disk_name);
-        col_path->insert(disk_ptr->getPath());
+        col_path->insert(fs::absolute(disk_ptr->getPath()).string());
         col_free->insert(disk_ptr->getAvailableSpace().value_or(std::numeric_limits<UInt64>::max()));
         col_total->insert(disk_ptr->getTotalSpace().value_or(std::numeric_limits<UInt64>::max()));
         col_unreserved->insert(disk_ptr->getUnreservedSpace().value_or(std::numeric_limits<UInt64>::max()));
diff --git a/src/Storages/System/StorageSystemPartsBase.cpp b/src/Storages/System/StorageSystemPartsBase.cpp
index 513af6cfc46..e97c13b1fed 100644
--- a/src/Storages/System/StorageSystemPartsBase.cpp
+++ b/src/Storages/System/StorageSystemPartsBase.cpp
@@ -64,7 +64,7 @@ StoragesInfo::getParts(MergeTreeData::DataPartStateVector & state, bool has_stat
 }
 
 MergeTreeData::ProjectionPartsVector
-StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const
+StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const
 {
     if (data->getInMemoryMetadataPtr()->projections.empty())
         return {};
 
@@ -74,12 +74,12 @@ StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, boo
     {
         /// If has_state_column is requested, return all states.
         if (!has_state_column)
-            return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, &state);
+            return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, fill_states);
 
-        return data->getAllProjectionPartsVector(&state);
+        return data->getAllProjectionPartsVector(fill_states);
     }
 
-    return data->getProjectionPartsVectorForInternalUsage({State::Active}, &state);
+    return data->getProjectionPartsVectorForInternalUsage({State::Active}, fill_states);
 }
 
 StoragesInfoStream::StoragesInfoStream(const SelectQueryInfo & query_info, ContextPtr context)
diff --git a/src/Storages/System/StorageSystemPartsBase.h b/src/Storages/System/StorageSystemPartsBase.h
index c3d2e64b303..e0e81f0d24d 100644
--- a/src/Storages/System/StorageSystemPartsBase.h
+++ b/src/Storages/System/StorageSystemPartsBase.h
@@ -25,7 +25,7 @@ struct StoragesInfo
     explicit operator bool() const { return storage != nullptr; }
 
     MergeTreeData::DataPartsVector getParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const;
-    MergeTreeData::ProjectionPartsVector getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const;
+    MergeTreeData::ProjectionPartsVector getProjectionParts(bool fill_states, bool has_state_column) const;
 };
 
 /** A helper class that enumerates the storages that match given query. */
diff --git a/src/Storages/System/StorageSystemProjectionParts.cpp b/src/Storages/System/StorageSystemProjectionParts.cpp
index 213865a8d61..44bdb294a2d 100644
--- a/src/Storages/System/StorageSystemProjectionParts.cpp
+++ b/src/Storages/System/StorageSystemProjectionParts.cpp
@@ -83,7 +83,11 @@ StorageSystemProjectionParts::StorageSystemProjectionParts(const StorageID & tab
 
         {"rows_where_ttl_info.expression", std::make_shared<DataTypeArray>(std::make_shared<DataTypeString>())},
         {"rows_where_ttl_info.min", std::make_shared<DataTypeArray>(std::make_shared<DataTypeDateTime>())},
-        {"rows_where_ttl_info.max", std::make_shared<DataTypeArray>(std::make_shared<DataTypeDateTime>())}
+        {"rows_where_ttl_info.max", std::make_shared<DataTypeArray>(std::make_shared<DataTypeDateTime>())},
+
+        {"is_broken", std::make_shared<DataTypeUInt8>()},
+        {"exception_code", std::make_shared<DataTypeInt32>()},
+        {"exception", std::make_shared<DataTypeString>()},
     }
     )
 {
@@ -93,15 +97,14 @@ void StorageSystemProjectionParts::processNextStorage(
     ContextPtr, MutableColumns & columns, std::vector<UInt8> & columns_mask, const StoragesInfo & info, bool has_state_column)
 {
     using State = MergeTreeDataPartState;
-    MergeTreeData::DataPartStateVector all_parts_state;
-    MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column);
-    for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number)
+    MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column);
+    auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states)
     {
-        const auto & part = all_parts.projection_parts[part_number];
+        const auto & part = parts[part_number];
         const auto * parent_part = part->getParentPart();
         chassert(parent_part);
 
-        auto part_state = all_parts_state[part_number];
+        auto part_state = states[part_number];
 
         ColumnSize columns_size = part->getTotalColumnsSize();
         ColumnSize parent_columns_size = parent_part->getTotalColumnsSize();
@@ -278,10 +281,43 @@ void StorageSystemProjectionParts::processNextStorage(
         add_ttl_info_map(part->ttl_infos.group_by_ttl);
         add_ttl_info_map(part->ttl_infos.rows_where_ttl);
 
+        {
+            if (columns_mask[src_index++])
+                columns[res_index++]->insert(part->is_broken.load(std::memory_order_relaxed));
+
+            if (part->is_broken)
+            {
+                std::lock_guard lock(part->broken_projections_mutex);
+                if (columns_mask[src_index++])
+                    columns[res_index++]->insert(part->exception_code);
+                if (columns_mask[src_index++])
+                    columns[res_index++]->insert(part->exception);
+            }
+            else
+            {
+                if (columns_mask[src_index++])
+                    columns[res_index++]->insertDefault();
+                if (columns_mask[src_index++])
+                    columns[res_index++]->insertDefault();
+            }
+        }
+
         /// _state column should be the latest.
         /// Do not use part->getState*, it can be changed from different thread
         if (has_state_column)
             columns[res_index++]->insert(IMergeTreeDataPart::stateString(part_state));
+    };
+
+    for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number)
+    {
+        auto part = all_parts.projection_parts[part_number];
+        fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states);
+    }
+
+    for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number)
+    {
+        auto part = all_parts.broken_projection_parts[part_number];
+        fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states);
+    }
 }
diff --git a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp
index 06becc6d91c..3f4224e46bb 100644
--- a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp
+++ b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp
@@ -103,15 +103,14 @@ void StorageSystemProjectionPartsColumns::processNextStorage(
     }
 
     /// Go through the list of projection parts.
-    MergeTreeData::DataPartStateVector all_parts_state;
-    MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column);
-    for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number)
+    MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column);
+    auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states)
     {
-        const auto & part = all_parts.projection_parts[part_number];
+        const auto & part = parts[part_number];
         const auto * parent_part = part->getParentPart();
         chassert(parent_part);
 
-        auto part_state = all_parts_state[part_number];
+        auto part_state = states[part_number];
 
         auto columns_size = part->getTotalColumnsSize();
         auto parent_columns_size = parent_part->getTotalColumnsSize();
@@ -260,6 +259,18 @@ void StorageSystemProjectionPartsColumns::processNextStorage(
             if (has_state_column)
                 columns[res_index++]->insert(part->stateString());
         }
+    };
+
+    for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number)
+    {
+        auto part = all_parts.projection_parts[part_number];
+        fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states);
+    }
+
+    for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number)
+    {
+        auto part = all_parts.broken_projection_parts[part_number];
+        fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states);
     }
 }
diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference
new file mode 100644
index 00000000000..d0b07e081db
--- /dev/null
+++ b/tests/queries/0_stateless/02916_broken_projection.reference
@@ -0,0
+1,224 @@ +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 +0 +broke metadata of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +check table full +all_0_0_0 1 +all_1_1_0 1 +all_3_3_0 1 +all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +0 +broke data of part 'proj_2' (parent part: all_2_2_0) +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +FILE_DOESNT_EXIST +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 [] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +0 +broke data of part 'proj_2' (parent part: all_3_3_0) +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +insert new part +insert new part +optimize +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +all_3_3_0 proj_2 NO_FILE_IN_DATA_PART +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 [] +all_3_3_0 0 ['proj'] +all_3_5_1 1 ['proj'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +0 +broke metadata of part 'proj' (parent part: all_1_1_0) +Detach - Attach +broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj_2 FILE_DOESNT_EXIST +all_3_3_0 proj_2 FILE_DOESNT_EXIST +0 +broke data of part 'proj_2' (parent part: all_1_1_0) +Detach - Attach +broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART +all_1_1_0 proj_2 FILE_DOESNT_EXIST +all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj_2 FILE_DOESNT_EXIST +all_3_3_0 proj_2 FILE_DOESNT_EXIST +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 [] +all_2_2_0 1 [] +all_3_3_0 0 ['proj'] +all_3_5_1 1 ['proj'] +all_4_4_0 0 
['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +check table full +all_3_5_1 1 +all_0_0_0 1 +all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. +all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +materialize projection proj +check table full +all_3_5_1_6 1 +all_0_0_0_6 1 +all_2_2_0_6 1 +all_1_1_0_6 1 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_6 1 ['proj','proj_2'] +all_1_1_0 0 [] +all_1_1_0_6 1 ['proj','proj_2'] +all_2_2_0 0 [] +all_2_2_0_6 1 ['proj','proj_2'] +all_3_3_0 0 ['proj'] +all_3_5_1 0 ['proj'] +all_3_5_1_6 1 ['proj'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 +materialize projection proj_2 +check table full +all_3_5_1_7 1 +all_0_0_0_7 1 +all_2_2_0_7 1 +all_1_1_0_7 1 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_6 0 ['proj','proj_2'] +all_0_0_0_7 1 ['proj','proj_2'] +all_1_1_0 0 [] +all_1_1_0_6 0 ['proj','proj_2'] +all_1_1_0_7 1 ['proj','proj_2'] +all_2_2_0 0 [] +all_2_2_0_6 0 ['proj','proj_2'] +all_2_2_0_7 1 ['proj','proj_2'] +all_3_3_0 0 ['proj'] +all_3_5_1 0 ['proj'] +all_3_5_1_6 0 ['proj'] +all_3_5_1_7 1 ['proj','proj_2'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh new file mode 100755 index 00000000000..81adfe6e49d --- /dev/null +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -0,0 +1,283 @@ +#!/usr/bin/env bash + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. 
"$CURDIR"/../shell_config.sh + +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE IF EXISTS test SYNC; +CREATE TABLE test +( + a String, + b String, + c Int32, + d Int32, + e Int32, + + PROJECTION proj + ( + SELECT c ORDER BY d + ), + PROJECTION proj_2 + ( + SELECT d ORDER BY c + ) +) +ENGINE = ReplicatedMergeTree('/test2/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +SETTINGS min_bytes_for_wide_part = 0, + max_parts_to_merge_at_once=3, + enable_vertical_merge_algorithm=1, + vertical_merge_algorithm_min_rows_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1; +" + +table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") + +function random() +{ + cat /dev/urandom | LC_ALL=C tr -dc 'a-zA-Z' | fold -w ${1:-8} | head -n 1 +} + +function insert() +{ + offset=$1 + size=$2 + echo 'insert new part' + $CLICKHOUSE_CLIENT -q "INSERT INTO test SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" +} + +function break_projection() +{ + part_name=$1 + parent_name=$2 + break_type=$3 + + read -r disk_name part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT disk_name, path + FROM system.projection_parts + WHERE table='test' + AND database=currentDatabase() + AND active=1 + AND part_name='$part_name' + AND parent_name='$parent_name' + LIMIT 1; + ") + + path=$($CLICKHOUSE_CLIENT -q "SELECT path FROM system.disks WHERE name='$disk_name'") + + # make sure path is absolute + $CLICKHOUSE_CLIENT -q "select throwIf(substring('$path', 1, 1) != '/', 'Path is relative: $path')" || exit + + if [ "$break_type" = "data" ] + then + rm "$path/$part_path/d.bin" + rm "$path/$part_path/c.bin" + echo "broke data of part '$part_name' (parent part: $parent_name)" + else + rm "$path/$part_path/columns.txt" + echo "broke metadata of part '$part_name' (parent part: $parent_name)" + fi +} + +function broken_projections_info() +{ + echo 'broken projections info' + $CLICKHOUSE_CLIENT -q " + SELECT parent_name, name, errors.name FROM + ( + SELECT parent_name, name, exception_code + FROM system.projection_parts + WHERE table='test' + AND database=currentDatabase() + AND is_broken = 1 + ) AS parts_info + INNER JOIN system.errors AS errors + ON parts_info.exception_code = errors.code + ORDER BY parent_name, name +" +} + +function check() +{ + expect_broken_part="" + expected_error="" + if [ $# -ne 0 ]; then + expect_broken_part=$1 + expected_error=$2 + fi + + echo 'system.parts' + $CLICKHOUSE_CLIENT -q " + SELECT name, active, projections + FROM system.parts + WHERE table='test' AND database=currentDatabase() + ORDER BY name;" + + echo "select from projection 'proj'" + query_id=$(random 8) + + if [ "$expect_broken_part" = "proj" ] + then + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12;" 2>&1 | grep -o $expected_error + else + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16;" + echo 'used projections' + $CLICKHOUSE_CLIENT -nm -q " + SYSTEM FLUSH LOGS; + SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + " + fi + + echo "select from projection 'proj_2'" + query_id=$(random 8) + + if [ "$expect_broken_part" = "proj_2" ] + then + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12;" 2>&1 | grep -o $expected_error + else + $CLICKHOUSE_CLIENT 
--optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16;"
+        echo 'used projections'
+        $CLICKHOUSE_CLIENT -nm -q "
+        SYSTEM FLUSH LOGS;
+        SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish'
+        "
+    fi
+
+    echo 'check table'
+    $CLICKHOUSE_CLIENT -q "CHECK TABLE test"
+}
+
+function optimize_no_wait()
+{
+    echo 'optimize'
+    $CLICKHOUSE_CLIENT -nm -q "OPTIMIZE TABLE test SETTINGS alter_sync=0;"
+}
+
+function reattach()
+{
+    echo 'Detach - Attach'
+    $CLICKHOUSE_CLIENT -nm -q "
+    DETACH TABLE test;
+    ATTACH TABLE test;
+    "
+}
+
+function materialize_projection
+{
+    projection=$1
+    echo "materialize projection $projection"
+    $CLICKHOUSE_CLIENT -q "ALTER TABLE test MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2"
+}
+
+function check_table_full()
+{
+    echo 'check table full'
+    $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0"
+}
+
+
+insert 0 5
+
+insert 5 5
+
+insert 10 5
+
+insert 15 5
+
+check
+
+# Break the metadata file of projection 'proj'.
+break_projection proj all_2_2_0 metadata
+
+# Run a select query and after it a "check table" query.
+# The select works because it does not read columns.txt.
+check
+
+# Projection 'proj' from part all_2_2_0 will now appear in broken parts info,
+# because it was marked broken during the "check table" query.
+# TODO: try to mark it during select as well
+broken_projections_info
+
+# The "check table" query will also show a list of parts which have broken projections.
+check_table_full
+
+# Break the data file of projection 'proj_2' for part all_2_2_0.
+break_projection proj_2 all_2_2_0 data
+
+# It will not yet appear in broken projections info.
+broken_projections_info
+
+# The select now fails with the error "File doesn't exist".
+check "proj_2" "FILE_DOESNT_EXIST"
+
+# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info.
+broken_projections_info
+
+# The second select works because the projection is now marked as broken.
+check
+
+# Break the data file of projection 'proj_2' for part all_3_3_0.
+break_projection proj_2 all_3_3_0 data
+
+# It will not yet appear in broken projections info.
+broken_projections_info
+
+insert 20 5
+
+insert 25 5
+
+# Part all_3_3_0 has projections 'proj' and 'proj_2', but 'proj_2' is broken and the server does NOT know it yet.
+# Parts all_4_4_0 and all_5_5_0 both have non-broken projections.
+# So a merge will be created for the future part all_3_5_1.
+# During the merge it will fail to read from 'proj_2' of part all_3_3_0, and 'proj_2' will be marked as broken.
+# The merge will be retried and will succeed on the second attempt.
+# The result part all_3_5_1 will have only one projection - 'proj', because
+# it will skip 'proj_2' after seeing that one source part no longer has it in the set of valid projections.
+optimize_no_wait
+sleep 2
+
+$CLICKHOUSE_CLIENT -nm -q "
+SYSTEM FLUSH LOGS;
+SELECT count() FROM system.text_log
+WHERE level='Error'
+AND logger_name='MergeTreeBackgroundExecutor'
+AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%'
+"
+
+# Projection 'proj_2' from part all_3_3_0 will now appear in broken parts info.
+broken_projections_info + +check + +break_projection proj all_1_1_0 metadata + +reattach + +broken_projections_info + +break_projection proj_2 all_1_1_0 data + +reattach + +broken_projections_info + +check + +check_table_full + +materialize_projection proj + +check_table_full + +check + +materialize_projection proj_2 + +check_table_full + +check + +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE test; +" From 6c42a3fad6b58efdf91115c3b80f267f1f604c62 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 16 Nov 2023 16:43:34 +0100 Subject: [PATCH 002/245] Better --- src/Interpreters/MutationsInterpreter.cpp | 18 ++-- .../Optimizations/projectionsCommon.cpp | 2 +- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 45 +++------ src/Storages/MergeTree/IMergeTreeDataPart.h | 11 +-- src/Storages/MergeTree/MergeTask.cpp | 5 +- src/Storages/MergeTree/MergeTreeData.cpp | 57 ++++++----- src/Storages/MergeTree/MergeTreeData.h | 4 +- src/Storages/MergeTree/MutateTask.cpp | 8 +- src/Storages/MergeTree/checkDataPart.cpp | 34 ++----- .../System/StorageSystemPartsBase.cpp | 8 +- src/Storages/System/StorageSystemPartsBase.h | 2 +- .../System/StorageSystemProjectionParts.cpp | 30 +++--- .../StorageSystemProjectionPartsColumns.cpp | 21 +--- .../02916_broken_projection.reference | 95 ++++++++----------- .../0_stateless/02916_broken_projection.sh | 12 +-- 15 files changed, 146 insertions(+), 206 deletions(-) diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp index a9a5d4f33d0..237bffe4a67 100644 --- a/src/Interpreters/MutationsInterpreter.cpp +++ b/src/Interpreters/MutationsInterpreter.cpp @@ -753,7 +753,7 @@ void MutationsInterpreter::prepare(bool dry_run) { mutation_kind.set(MutationKind::MUTATE_INDEX_PROJECTION); const auto & projection = projections_desc.get(command.projection_name); - if (!source.hasProjection(projection.name)) + if (!source.hasProjection(projection.name) || source.hasBrokenProjection(projection.name)) { for (const auto & column : projection.required_columns) dependencies.emplace(column, ColumnDependency::PROJECTION); @@ -927,20 +927,18 @@ void MutationsInterpreter::prepare(bool dry_run) materialized_indices.insert(index.name); } - /// Always rebuild broken projections. - for (const auto & projection : metadata_snapshot->getProjections()) - { - if (!source.hasBrokenProjection(projection.name)) - continue; - - materialized_projections.insert(projection.name); - } - for (const auto & projection : metadata_snapshot->getProjections()) { if (!source.hasProjection(projection.name)) continue; + /// Always rebuild broken projections. 
+ if (source.hasBrokenProjection(projection.name)) + { + materialized_projections.insert(projection.name); + continue; + } + if (need_rebuild_projections) { materialized_projections.insert(projection.name); diff --git a/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp b/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp index c3b3449857b..9ebd5aaa32f 100644 --- a/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp +++ b/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp @@ -224,7 +224,7 @@ bool analyzeProjectionCandidate( { const auto & created_projections = part_with_ranges.data_part->getProjectionParts(); auto it = created_projections.find(candidate.projection->name); - if (it != created_projections.end()) + if (it != created_projections.end() && !it->second->is_broken) { projection_parts.push_back(it->second); } diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index bc81758675e..85ce112d9a1 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -745,8 +745,7 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"), "Cannot load projection {}, will consider it broken", projection.name); - addBrokenProjectionPart(projection.name, std::move(part), getCurrentExceptionMessage(false), getCurrentExceptionCode()); - continue; + part->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); } addProjectionPart(projection.name, std::move(part)); @@ -2147,44 +2146,30 @@ std::optional IMergeTreeDataPart::getStreamNameForColumn( return getStreamNameOrHash(stream_name, extension, storage_); } -void IMergeTreeDataPart::addBrokenProjectionPart( - const String & projection_name, - std::shared_ptr projection_part, - const String & message, - int code) -{ - projection_part->setBrokenReason(message, code); - bool inserted = broken_projection_parts.emplace(projection_name, projection_part).second; - if (!inserted) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Projection part {} in part {} is already added to a broken projection parts list", projection_name, name); -} - void IMergeTreeDataPart::markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const { - std::lock_guard lock(broken_projections_mutex); - auto it = projection_parts.find(projection_name); if (it == projection_parts.end()) throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no projection part '{}'", projection_name); - it->second->setBrokenReason(message, code); - - broken_projection_parts.emplace(projection_name, it->second); - projection_parts.erase(it); -} - -void IMergeTreeDataPart::setBrokenReason(const String & message, int code) -{ - std::lock_guard lock(broken_projections_mutex); - is_broken = true; - exception = message; - exception_code = code; } bool IMergeTreeDataPart::hasBrokenProjection(const String & projection_name) const { - std::lock_guard lock(broken_projections_mutex); - return broken_projection_parts.contains(projection_name); + auto it = projection_parts.find(projection_name); + if (it == projection_parts.end()) + return false; + return it->second->is_broken; +} + +void IMergeTreeDataPart::setBrokenReason(const String & message, int code) const +{ + std::lock_guard lock(broken_reason_mutex); + if (is_broken) + return; + is_broken = true; + exception = message; + exception_code = code; } bool isCompactPart(const 
MergeTreeDataPartPtr & data_part) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 52a1541e15f..9af2c16f1e8 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -259,7 +259,7 @@ public: mutable std::atomic is_broken {false}; mutable std::string exception; mutable int exception_code = 0; - mutable std::mutex broken_projections_mutex; + mutable std::mutex broken_reason_mutex; /// Indicates that the part was marked Outdated by PartCheckThread because the part was not committed to ZooKeeper mutable bool is_unexpected_local_part = false; @@ -411,14 +411,10 @@ public: const std::map> & getProjectionParts() const { return projection_parts; } - const std::map> & getBrokenProjectionParts() const { return broken_projection_parts; } - MergeTreeDataPartBuilder getProjectionPartBuilder(const String & projection_name, bool is_temp_projection = false); void addProjectionPart(const String & projection_name, std::shared_ptr && projection_part); - void addBrokenProjectionPart(const String & projection_name, std::shared_ptr projection_part, const String & message, int code); - void markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const; bool hasProjection(const String & projection_name) const { return projection_parts.contains(projection_name); } @@ -427,6 +423,8 @@ public: void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); + void setBrokenReason(const String & message, int code) const; + /// Return set of metadata file names without checksums. For example, /// columns.txt or checksums.txt itself. NameSet getFileNamesWithoutChecksums() const; @@ -579,7 +577,6 @@ protected: String parent_part_name; mutable std::map> projection_parts; - mutable std::map> broken_projection_parts; mutable PartMetadataManagerPtr metadata_manager; @@ -693,8 +690,6 @@ private: void incrementStateMetric(MergeTreeDataPartState state) const; void decrementStateMetric(MergeTreeDataPartState state) const; - void setBrokenReason(const String & message, int code); - /// This ugly flag is needed for debug assertions only mutable bool part_is_probably_removed_from_disk = false; }; diff --git a/src/Storages/MergeTree/MergeTask.cpp b/src/Storages/MergeTree/MergeTask.cpp index adb1ca72e46..53ba1a57b27 100644 --- a/src/Storages/MergeTree/MergeTask.cpp +++ b/src/Storages/MergeTree/MergeTask.cpp @@ -696,8 +696,9 @@ bool MergeTask::MergeProjectionsStage::mergeMinMaxIndexAndPrepareProjections() c MergeTreeData::DataPartsVector projection_parts; for (const auto & part : global_ctx->future_part->parts) { - auto it = part->getProjectionParts().find(projection.name); - if (it != part->getProjectionParts().end()) + auto actual_projection_parts = part->getProjectionParts(); + auto it = actual_projection_parts.find(projection.name); + if (it != actual_projection_parts.end() && !it->second->is_broken) projection_parts.push_back(it->second); } if (projection_parts.size() < global_ctx->future_part->parts.size()) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 152c386e188..0725c3cbf32 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -5737,7 +5737,7 @@ MergeTreeData::getDataPartsVectorForInternalUsage(const DataPartStates & afforda } MergeTreeData::ProjectionPartsVector -MergeTreeData::getProjectionPartsVectorForInternalUsage(const 
DataPartStates & affordable_states, bool fill_states) const +MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, DataPartStateVector * out_states) const { auto lock = lockParts(); ProjectionPartsVector res; @@ -5749,20 +5749,14 @@ MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & a res.data_parts.push_back(part); for (const auto & [_, projection_part] : part->getProjectionParts()) res.projection_parts.push_back(projection_part); - for (const auto & [_, projection_part] : part->getBrokenProjectionParts()) - res.broken_projection_parts.push_back(projection_part); } } - if (fill_states) + if (out_states != nullptr) { - res.projection_parts_states.resize(res.projection_parts.size()); + out_states->resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); - - res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); - for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) - (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); + (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); } return res; @@ -5815,7 +5809,7 @@ bool MergeTreeData::supportsLightweightDelete() const return true; } -MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(bool fill_states) const +MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states) const { ProjectionPartsVector res; auto lock = lockParts(); @@ -5826,15 +5820,11 @@ MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector( res.projection_parts.push_back(projection_part); } - if (fill_states) + if (out_states != nullptr) { - res.projection_parts_states.resize(res.projection_parts.size()); + out_states->resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); - - res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); - for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) - (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); + (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); } return res; } @@ -7050,8 +7040,7 @@ std::pair MergeTreeData::cloneAn } } - auto projections = src_part->getProjectionParts(); - for (const auto & [name, projection_part] : projections) + for (const auto & [name, projection_part] : src_part->getProjectionParts()) { const auto & projection_storage = projection_part->getDataPartStorage(); for (auto it = projection_storage.iterate(); it->isValid(); it->next()) @@ -7654,21 +7643,39 @@ MovePartsOutcome MergeTreeData::moveParts(const CurrentlyMovingPartsTaggerPtr & bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const DataPartPtr & right, String & out_reason) { - if (left->getProjectionParts().size() != right->getProjectionParts().size()) + auto remove_broken_parts = [](auto & parts) + { + std::set broken_projection_parts; + for (const auto & [name, part] : parts) + { + if (part->is_broken) + broken_projection_parts.emplace(name); + } + for (const auto & name : broken_projection_parts) + parts.erase(name); + }; + + auto left_projection_parts = left->getProjectionParts(); + 
auto right_projection_parts = right->getProjectionParts(); + + remove_broken_parts(left_projection_parts); + remove_broken_parts(right_projection_parts); + + if (left_projection_parts.size() != right_projection_parts.size()) { out_reason = fmt::format( "Parts have different number of projections: {} in part '{}' and {} in part '{}'", - left->getProjectionParts().size(), + left_projection_parts.size(), left->name, - right->getProjectionParts().size(), + right_projection_parts.size(), right->name ); return false; } - for (const auto & [name, _] : left->getProjectionParts()) + for (const auto & [name, _] : left_projection_parts) { - if (!right->hasProjection(name)) + if (!right_projection_parts.contains(name)) { out_reason = fmt::format( "The part '{}' doesn't have projection '{}' while part '{}' does", right->name, name, left->name
diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h
index 4ef3b75988b..18087c6b059 100644
--- a/src/Storages/MergeTree/MergeTreeData.h
+++ b/src/Storages/MergeTree/MergeTreeData.h
@@ -489,7 +489,7 @@ public: const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const; /// Same as above but only returns projection parts ProjectionPartsVector getProjectionPartsVectorForInternalUsage( - const DataPartStates & affordable_states, bool fill_states = false) const; + const DataPartStates & affordable_states, MergeTreeData::DataPartStateVector * out_states) const; /// Returns absolutely all parts (and snapshot of their states)
@@ -501,7 +501,7 @@ public: size_t getTotalMarksCount() const; /// Same as above but only returns projection parts - ProjectionPartsVector getAllProjectionPartsVector(bool fill_states = false) const; + ProjectionPartsVector getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states = nullptr) const; /// Returns parts in Active state DataParts getDataPartsForInternalUsage() const;
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 8ef1621b647..6a1ceec1cd3 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -514,8 +514,8 @@ static std::set<ProjectionDescriptionRawPtr> getProjectionsToRecalculate( bool need_recalculate = materialized_projections.contains(projection.name) || (!is_full_part_storage - && (source_part->hasProjection(projection.name) - || source_part->hasBrokenProjection(projection.name))); + && source_part->hasProjection(projection.name) + && !source_part->hasBrokenProjection(projection.name)); if (need_recalculate) projections_to_recalc.insert(&projection);
@@ -1370,8 +1370,8 @@ private: bool need_recalculate = ctx->materialized_projections.contains(projection.name) || (!is_full_part_storage - && (ctx->source_part->hasProjection(projection.name) - || ctx->source_part->hasBrokenProjection(projection.name))); + && ctx->source_part->hasProjection(projection.name) + && !ctx->source_part->hasBrokenProjection(projection.name)); if (need_recalculate) {
diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp
index 74af7cbb77c..8feabf344b5 100644
--- a/src/Storages/MergeTree/checkDataPart.cpp
+++ b/src/Storages/MergeTree/checkDataPart.cpp
@@ -272,14 +272,16 @@ static IMergeTreeDataPart::Checksums checkDataPart( } } - auto check_projection = [&](const String & name, std::shared_ptr<IMergeTreeDataPart> projection) + for (const auto & [name, projection] : data_part->getProjectionParts()) { + if (is_cancelled()) + return {}; + auto projection_file = name + ".proj"; if
(!throw_on_broken_projection && projection->is_broken) { projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); - return; } IMergeTreeDataPart::Checksums projection_checksums; @@ -297,10 +299,11 @@ static IMergeTreeDataPart::Checksums checkDataPart( if (isRetryableException(std::current_exception())) throw; - LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file); - - if (!data_part->hasBrokenProjection(name)) - data_part->markProjectionPartAsBroken(name, getCurrentExceptionMessage(false), getCurrentExceptionCode()); + if (!projection->is_broken) + { + LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file); + projection->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); + } is_broken_projection = true; if (throw_on_broken_projection) @@ -308,7 +311,6 @@ static IMergeTreeDataPart::Checksums checkDataPart( projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); - return; } checksums_data.files[projection_file] = IMergeTreeDataPart::Checksums::Checksum( @@ -316,24 +318,6 @@ static IMergeTreeDataPart::Checksums checkDataPart( projection_checksums.getTotalChecksumUInt128()); projections_on_disk.erase(projection_file); - }; - - auto broken_projection_parts = data_part->getBrokenProjectionParts(); /// Iterate over copy - for (const auto & [name, projection] : broken_projection_parts) - { - if (is_cancelled()) - return {}; - else - check_projection(name, projection); - } - - auto projection_parts = data_part->getProjectionParts(); /// Iterate over copy - for (const auto & [name, projection] : projection_parts) - { - if (is_cancelled()) - return {}; - else - check_projection(name, projection); } if (require_checksums && !projections_on_disk.empty()) diff --git a/src/Storages/System/StorageSystemPartsBase.cpp b/src/Storages/System/StorageSystemPartsBase.cpp index e97c13b1fed..513af6cfc46 100644 --- a/src/Storages/System/StorageSystemPartsBase.cpp +++ b/src/Storages/System/StorageSystemPartsBase.cpp @@ -64,7 +64,7 @@ StoragesInfo::getParts(MergeTreeData::DataPartStateVector & state, bool has_stat } MergeTreeData::ProjectionPartsVector -StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const +StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const { if (data->getInMemoryMetadataPtr()->projections.empty()) return {}; @@ -74,12 +74,12 @@ StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const { /// If has_state_column is requested, return all states. 
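/// (An illustrative sketch rather than code from this patch: has_state_column is set
/// when a query touches the virtual `_state` column of the system.parts family, e.g.
///     SELECT name, _state FROM system.projection_parts
/// and in that case projection parts in all states are returned; otherwise only
/// Active, or Active plus Outdated, parts are visible.)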
if (!has_state_column) - return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, fill_states); + return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, &state); - return data->getAllProjectionPartsVector(fill_states); + return data->getAllProjectionPartsVector(&state); } - return data->getProjectionPartsVectorForInternalUsage({State::Active}, fill_states); + return data->getProjectionPartsVectorForInternalUsage({State::Active}, &state); } StoragesInfoStream::StoragesInfoStream(const SelectQueryInfo & query_info, ContextPtr context) diff --git a/src/Storages/System/StorageSystemPartsBase.h b/src/Storages/System/StorageSystemPartsBase.h index e0e81f0d24d..c3d2e64b303 100644 --- a/src/Storages/System/StorageSystemPartsBase.h +++ b/src/Storages/System/StorageSystemPartsBase.h @@ -25,7 +25,7 @@ struct StoragesInfo explicit operator bool() const { return storage != nullptr; } MergeTreeData::DataPartsVector getParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; - MergeTreeData::ProjectionPartsVector getProjectionParts(bool fill_states, bool has_state_column) const; + MergeTreeData::ProjectionPartsVector getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; }; /** A helper class that enumerates the storages that match given query. */ diff --git a/src/Storages/System/StorageSystemProjectionParts.cpp b/src/Storages/System/StorageSystemProjectionParts.cpp index 44bdb294a2d..3dbe6823dac 100644 --- a/src/Storages/System/StorageSystemProjectionParts.cpp +++ b/src/Storages/System/StorageSystemProjectionParts.cpp @@ -97,14 +97,15 @@ void StorageSystemProjectionParts::processNextStorage( ContextPtr, MutableColumns & columns, std::vector & columns_mask, const StoragesInfo & info, bool has_state_column) { using State = MergeTreeDataPartState; - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); - auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) + MergeTreeData::DataPartStateVector all_parts_state; + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) { - const auto & part = parts[part_number]; + const auto & part = all_parts.projection_parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = states[part_number]; + auto part_state = all_parts_state[part_number]; ColumnSize columns_size = part->getTotalColumnsSize(); ColumnSize parent_columns_size = parent_part->getTotalColumnsSize(); @@ -275,7 +276,12 @@ void StorageSystemProjectionParts::processNextStorage( add_ttl_info_map(part->ttl_infos.moves_ttl); if (columns_mask[src_index++]) - columns[res_index++]->insert(queryToString(part->default_codec->getCodecDesc())); + { + if (part->default_codec) + columns[res_index++]->insert(queryToString(part->default_codec->getCodecDesc())); + else + columns[res_index++]->insertDefault(); + } add_ttl_info_map(part->ttl_infos.recompression_ttl); add_ttl_info_map(part->ttl_infos.group_by_ttl); @@ -287,7 +293,7 @@ void StorageSystemProjectionParts::processNextStorage( if (part->is_broken) { - std::lock_guard lock(part->broken_projections_mutex); + std::lock_guard lock(part->broken_reason_mutex); if (columns_mask[src_index++]) 
columns[res_index++]->insert(part->exception_code); if (columns_mask[src_index++]) @@ -306,18 +312,6 @@ void StorageSystemProjectionParts::processNextStorage( /// Do not use part->getState*, it can be changed from different thread if (has_state_column) columns[res_index++]->insert(IMergeTreeDataPart::stateString(part_state)); - }; - - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) - { - auto part = all_parts.projection_parts[part_number]; - fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); - } - - for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) - { - auto part = all_parts.broken_projection_parts[part_number]; - fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp index 3f4224e46bb..06becc6d91c 100644 --- a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp +++ b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp @@ -103,14 +103,15 @@ void StorageSystemProjectionPartsColumns::processNextStorage( } /// Go through the list of projection parts. - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); - auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) + MergeTreeData::DataPartStateVector all_parts_state; + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) { - const auto & part = parts[part_number]; + const auto & part = all_parts.projection_parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = states[part_number]; + auto part_state = all_parts_state[part_number]; auto columns_size = part->getTotalColumnsSize(); auto parent_columns_size = parent_part->getTotalColumnsSize(); @@ -259,18 +260,6 @@ void StorageSystemProjectionPartsColumns::processNextStorage( if (has_state_column) columns[res_index++]->insert(part->stateString()); } - }; - - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) - { - auto part = all_parts.projection_parts[part_number]; - fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); - } - - for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) - { - auto part = all_parts.broken_projection_parts[part_number]; - fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index d0b07e081db..62966036eed 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -8,15 +8,15 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' 12 16 used 
projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 0 @@ -27,23 +27,20 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST check table full -all_0_0_0 1 -all_1_1_0 1 -all_3_3_0 1 all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. 0 broke data of part 'proj_2' (parent part: all_2_2_0) @@ -52,13 +49,13 @@ all_2_2_0 proj FILE_DOESNT_EXIST system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj_2'] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' FILE_DOESNT_EXIST check table @@ -69,18 +66,18 @@ all_2_2_0 proj_2 NO_FILE_IN_DATA_PART system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 [] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 0 @@ -99,21 +96,21 @@ all_3_3_0 proj_2 NO_FILE_IN_DATA_PART system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 [] -all_3_3_0 0 ['proj'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 0 @@ -135,76 +132,66 @@ all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST system.parts all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 [] -all_2_2_0 1 [] -all_3_3_0 0 ['proj'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 
OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 check table full -all_3_5_1 1 -all_0_0_0 1 -all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. materialize projection proj check table full -all_3_5_1_6 1 -all_0_0_0_6 1 -all_2_2_0_6 1 -all_1_1_0_6 1 system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] -all_1_1_0 0 [] +all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 1 ['proj','proj_2'] -all_2_2_0 0 [] +all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 1 ['proj','proj_2'] -all_3_3_0 0 ['proj'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 materialize projection proj_2 check table full -all_3_5_1_7 1 -all_0_0_0_7 1 -all_2_2_0_7 1 -all_1_1_0_7 1 system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 0 ['proj','proj_2'] all_0_0_0_7 1 ['proj','proj_2'] -all_1_1_0 0 [] +all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 0 ['proj','proj_2'] all_1_1_0_7 1 ['proj','proj_2'] -all_2_2_0 0 [] +all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 0 ['proj','proj_2'] all_2_2_0_7 1 ['proj','proj_2'] -all_3_3_0 0 ['proj'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 0 ['proj'] all_3_5_1_7 1 ['proj','proj_2'] @@ -214,11 +201,11 @@ select from projection 'proj' 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 81adfe6e49d..4748506d9cf 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -23,7 +23,7 @@ CREATE TABLE test SELECT d ORDER BY c ) ) -ENGINE = ReplicatedMergeTree('/test2/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +ENGINE = ReplicatedMergeTree('/test3/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -119,9 +119,9 @@ function check() if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' 
$CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -134,9 +134,9 @@ function check() if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -173,7 +173,7 @@ function materialize_projection function check_table_full() { echo 'check table full' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" + $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" | grep "broken" } From 8ea4e302a50db872a798c6cd39c6f5edb255ec49 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 16 Nov 2023 19:43:32 +0100 Subject: [PATCH 003/245] Fix style check --- .../0_stateless/02916_broken_projection.sh | 31 ++++++++++++++++--- 1 file changed, 26 insertions(+), 5 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 4748506d9cf..bf0ec61fd76 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh @@ -125,7 +126,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -140,7 +141,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -148,10 +149,20 @@ function check() $CLICKHOUSE_CLIENT -q "CHECK TABLE test" } -function optimize_no_wait() +function optimize() { + final=$1 + no_wait=$2 + echo 'optimize' - $CLICKHOUSE_CLIENT -nm -q "OPTIMIZE TABLE test SETTINGS alter_sync=0;" + query="OPTIMIZE TABLE test" + + if [ $final -eq 1 ]; then + query="$query FINAL" + if [ $no_wait -eq 1 ]; then + query="$query SETTINGS alter_sync=0" + + $CLICKHOUSE_CLIENT -nm -q $query } function reattach() @@ -234,7 +245,7 @@ insert 25 5 # Merge will be retried and on second attempt it will succeed. # The result part all_3_5_1 will have only 1 projection - 'proj', because # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. 
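# A minimal sketch (assuming the is_broken / exception_code columns that this
# patch adds to system.projection_parts) of how the skipped broken projection
# parts can be inspected directly:
#   $CLICKHOUSE_CLIENT -q "SELECT parent_name, name, exception_code FROM system.projection_parts WHERE table = 'test' AND database = currentDatabase() AND is_broken"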
-optimize_no_wait +optimize 0 1 sleep 2 $CLICKHOUSE_CLIENT -nm -q " @@ -276,6 +287,16 @@ materialize_projection proj_2 check_table_full +break_projection proj all_3_5_1_7 data + +insert 30 5 + +optimize 1 0 + +insert 35 5 + +optimize 1 0 + check $CLICKHOUSE_CLIENT -nm -q " From 42b2fe9adcf4596e8e36231068911c5dbdc4948f Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 21 Nov 2023 13:21:35 +0100 Subject: [PATCH 004/245] Fxi --- src/Common/ErrorCodes.cpp | 1 + .../ReplicatedMergeTreePartCheckThread.cpp | 10 +- src/Storages/MergeTree/checkDataPart.cpp | 17 +++- .../02916_broken_projection.reference | 93 ++++++++++--------- .../0_stateless/02916_broken_projection.sh | 39 ++++---- 5 files changed, 94 insertions(+), 66 deletions(-) diff --git a/src/Common/ErrorCodes.cpp b/src/Common/ErrorCodes.cpp index 28f8e6c6021..9c3aab5ad01 100644 --- a/src/Common/ErrorCodes.cpp +++ b/src/Common/ErrorCodes.cpp @@ -586,6 +586,7 @@ M(704, CANNOT_USE_QUERY_CACHE_WITH_NONDETERMINISTIC_FUNCTIONS) \ M(705, TABLE_NOT_EMPTY) \ M(706, LIBSSH_ERROR) \ + M(707, BROKEN_PROJECTION) \ M(999, KEEPER_EXCEPTION) \ M(1000, POCO_EXCEPTION) \ M(1001, STD_EXCEPTION) \ diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp index 4468cf8e3bf..ba4d4869025 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp @@ -63,7 +63,7 @@ void ReplicatedMergeTreePartCheckThread::enqueuePart(const String & name, time_t if (parts_set.contains(name)) return; - LOG_TRACE(log, "Enqueueing {} for check after after {}s", name, delay_to_check_seconds); + LOG_TRACE(log, "Enqueueing {} for check after {}s", name, delay_to_check_seconds); parts_queue.emplace_back(name, std::chrono::steady_clock::now() + std::chrono::seconds(delay_to_check_seconds)); parts_set.insert(name); task->schedule(); @@ -385,17 +385,19 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St if (isRetryableException(std::current_exception())) throw; - tryLogCurrentException(log, __PRETTY_FUNCTION__); - PreformattedMessage message; if (is_broken_projection) { - message = PreformattedMessage::create("Part {} has a broken projection. It will be ignored.", part_name); + message = PreformattedMessage::create( + "Part {} has a broken projections. It will be ignored. Broken projections info: \n{}", + part_name, getCurrentExceptionMessage(false)); LOG_DEBUG(log, message); result.action = ReplicatedCheckResult::DoNothing; } else { + tryLogCurrentException(log, __PRETTY_FUNCTION__); + message = PreformattedMessage::create("Part {} looks broken. 
Removing it and will try to fetch.", part_name); LOG_ERROR(log, message); result.action = ReplicatedCheckResult::TryFetchMissing; diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index 8feabf344b5..3bb6f763c8b 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -42,6 +42,7 @@ namespace ErrorCodes extern const int NO_FILE_IN_DATA_PART; extern const int NETWORK_ERROR; extern const int SOCKET_TIMEOUT; + extern const int BROKEN_PROJECTION; } @@ -272,6 +273,7 @@ static IMergeTreeDataPart::Checksums checkDataPart( } } + std::string broken_projections_message; for (const auto & [name, projection] : data_part->getProjectionParts()) { if (is_cancelled()) @@ -307,7 +309,15 @@ static IMergeTreeDataPart::Checksums checkDataPart( is_broken_projection = true; if (throw_on_broken_projection) - throw; + { + if (!broken_projections_message.empty()) + broken_projections_message += "\n"; + + broken_projections_message += fmt::format( + "Part {} has a broken projection {} (error: {})", + data_part->name, name, getCurrentExceptionMessage(false)); + continue; + } projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); @@ -320,6 +330,11 @@ static IMergeTreeDataPart::Checksums checkDataPart( projections_on_disk.erase(projection_file); } + if (throw_on_broken_projection && !broken_projections_message.empty()) + { + throw Exception(ErrorCodes::BROKEN_PROJECTION, broken_projections_message.data()); + } + if (require_checksums && !projections_on_disk.empty()) { throw Exception(ErrorCodes::UNEXPECTED_FILE_IN_DATA_PART, diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 62966036eed..aee18a21fb8 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -7,42 +7,40 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 -0 broke metadata of part 'proj' (parent part: all_2_2_0) system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST check table full -all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. -0 +all_2_2_0 0 Part all_2_2_0 has a broken projections. 
It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -51,13 +49,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: proj_2 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' -FILE_DOESNT_EXIST +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: proj_2 check table 0 broken projections info @@ -68,19 +65,18 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 -0 broke data of part 'proj_2' (parent part: all_3_3_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -88,6 +84,7 @@ all_2_2_0 proj_2 NO_FILE_IN_DATA_PART insert new part insert new part optimize +OPTIMIZE TABLE test SETTINGS alter_sync=0 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -101,19 +98,18 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 -0 broke metadata of part 'proj' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -121,7 +117,6 @@ all_1_1_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST -0 broke data of part 'proj_2' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -138,21 +133,21 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections 
-SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 check table full -all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. -all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. +all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_2_2_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +all_1_1_0 0 Part all_1_1_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_1_1_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_1_1_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_1_1_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) materialize projection proj check table full system.parts @@ -167,45 +162,55 @@ all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 materialize projection proj_2 check table full +broke data of part 'proj' (parent part: all_3_5_1_7) +insert new part +optimize +OPTIMIZE TABLE test FINAL +insert new part +optimize +OPTIMIZE TABLE test FINAL system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 0 ['proj','proj_2'] -all_0_0_0_7 1 ['proj','proj_2'] +all_0_0_0_7 0 ['proj','proj_2'] +all_0_8_2_7 1 ['proj_2'] all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 0 ['proj','proj_2'] -all_1_1_0_7 1 ['proj','proj_2'] +all_1_1_0_7 0 ['proj','proj_2'] all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 0 ['proj','proj_2'] -all_2_2_0_7 1 ['proj','proj_2'] +all_2_2_0_7 0 ['proj','proj_2'] all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 0 ['proj'] -all_3_5_1_7 1 ['proj','proj_2'] +all_3_5_1_7 0 ['proj','proj_2'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +all_8_8_0 0 ['proj','proj_2'] +all_9_9_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj_2'] +select from projection 'proj_2', 
expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index bf0ec61fd76..bf382624787 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -24,7 +24,7 @@ CREATE TABLE test SELECT d ORDER BY c ) ) -ENGINE = ReplicatedMergeTree('/test3/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +ENGINE = ReplicatedMergeTree('/test4/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -65,18 +65,13 @@ function break_projection() LIMIT 1; ") - path=$($CLICKHOUSE_CLIENT -q "SELECT path FROM system.disks WHERE name='$disk_name'") - - # make sure path is absolute - $CLICKHOUSE_CLIENT -q "select throwIf(substring('$path', 1, 1) != '/', 'Path is relative: $path')" || exit - if [ "$break_type" = "data" ] then - rm "$path/$part_path/d.bin" - rm "$path/$part_path/c.bin" + rm "$part_path/d.bin" + rm "$part_path/c.bin" echo "broke data of part '$part_name' (parent part: $parent_name)" else - rm "$path/$part_path/columns.txt" + rm "$part_path/columns.txt" echo "broke metadata of part '$part_name' (parent part: $parent_name)" fi } @@ -115,12 +110,12 @@ function check() WHERE table='test' AND database=currentDatabase() ORDER BY name;" - echo "select from projection 'proj'" + echo "select from projection 'proj', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' @@ -130,12 +125,12 @@ function check() " fi - echo "select from projection 'proj_2'" + echo "select from projection 'proj_2', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' @@ -146,7 +141,9 @@ function check() fi echo 'check table' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test" + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test;" } function optimize() @@ -159,16 +156,21 @@ function optimize() if [ $final -eq 1 ]; then query="$query FINAL" + fi if [ $no_wait -eq 1 ]; then query="$query SETTINGS alter_sync=0" + fi - $CLICKHOUSE_CLIENT -nm -q $query + echo $query + + $CLICKHOUSE_CLIENT -q "$query" } function reattach() { echo 'Detach - Attach' $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; DETACH TABLE 
test; ATTACH TABLE test; " @@ -184,7 +186,10 @@ function materialize_projection function check_table_full() { echo 'check table full' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" | grep "broken" + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS check_query_single_value_result = 0; +" | grep "broken" } @@ -300,5 +305,5 @@ optimize 1 0 check $CLICKHOUSE_CLIENT -nm -q " -DROP TABLE test; +DROP TABLE test SYNC; " From bcc87c01771414806fca705b5c9b5e0e925dea5f Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 21 Nov 2023 17:17:36 +0100 Subject: [PATCH 005/245] Better test --- .../ReplicatedMergeTreePartCheckThread.cpp | 3 +- src/Storages/System/StorageSystemDisks.cpp | 2 +- .../02916_broken_projection.reference | 43 +++++++++---------- .../0_stateless/02916_broken_projection.sh | 27 ++++++++---- 4 files changed, 42 insertions(+), 33 deletions(-) diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp index ba4d4869025..d058113e134 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp @@ -388,8 +388,9 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St PreformattedMessage message; if (is_broken_projection) { + WriteBufferFromOwnString wb; message = PreformattedMessage::create( - "Part {} has a broken projections. It will be ignored. Broken projections info: \n{}", + "Part {} has a broken projections. It will be ignored. Broken projections info: {}", part_name, getCurrentExceptionMessage(false)); LOG_DEBUG(log, message); result.action = ReplicatedCheckResult::DoNothing; diff --git a/src/Storages/System/StorageSystemDisks.cpp b/src/Storages/System/StorageSystemDisks.cpp index 250fcdba641..23a00cc7ae5 100644 --- a/src/Storages/System/StorageSystemDisks.cpp +++ b/src/Storages/System/StorageSystemDisks.cpp @@ -63,7 +63,7 @@ Pipe StorageSystemDisks::read( for (const auto & [disk_name, disk_ptr] : context->getDisksMap()) { col_name->insert(disk_name); - col_path->insert(fs::absolute(disk_ptr->getPath()).string()); + col_path->insert(disk_ptr->getPath()); col_free->insert(disk_ptr->getAvailableSpace().value_or(std::numeric_limits::max())); col_total->insert(disk_ptr->getTotalSpace().value_or(std::numeric_limits::max())); col_unreserved->insert(disk_ptr->getUnreservedSpace().value_or(std::numeric_limits::max())); diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index aee18a21fb8..1b84ca96840 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -11,12 +11,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 broke metadata of part 'proj' (parent part: all_2_2_0) @@ -29,18 +29,18 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY 
c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -check table full -all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +check table full (all_2_2_0) +all_2_2_0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -53,7 +53,7 @@ select from projection 'proj', expect error: proj_2 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: proj_2 check table 0 @@ -69,12 +69,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broke data of part 'proj_2' (parent part: all_3_3_0) @@ -102,12 +102,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broke metadata of part 'proj' (parent part: all_1_1_0) @@ -137,19 +137,18 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 -check table full -all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_2_2_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) -all_1_1_0 0 Part all_1_1_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_1_1_0 has a broken projection proj (error: Code: 107. 
DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_1_1_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_1_1_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +check table full (all_1_1_0) +all_1_1_0 materialize projection proj -check table full +check table full () system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] @@ -166,16 +165,16 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 materialize projection proj_2 -check table full +check table full () broke data of part 'proj' (parent part: all_3_5_1_7) insert new part optimize @@ -206,11 +205,11 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj_2'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index bf382624787..a522de42c89 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -121,7 +121,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -136,7 +136,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -185,11 +185,20 @@ function materialize_projection function check_table_full() { - echo 'check table full' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; -" | grep "broken" + echo "check table full ($1)" + expect_broken_part=$1 + if [ "$expect_broken_part" = "" ] + then + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS check_query_single_value_result = 0; + " | grep "broken" + else + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS check_query_single_value_result = 0; + " | grep "broken" | grep -o $expect_broken_part | head -n 1 + fi } @@ -216,7 +225,7 @@ check 
broken_projections_info # Check table query will also show a list of parts which have broken projections. -check_table_full +check_table_full "all_2_2_0" # Break data file of projection 'proj_2' for part all_2_2_0 break_projection proj_2 all_2_2_0 data @@ -280,7 +289,7 @@ broken_projections_info check -check_table_full +check_table_full all_1_1_0 materialize_projection proj From e8d99cb29654645c5a89d6cb15856b48a55d7bdf Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 22 Nov 2023 12:34:31 +0100 Subject: [PATCH 006/245] Fix style check --- tests/queries/0_stateless/02916_broken_projection.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a522de42c89..6ed92e2e06e 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -54,8 +54,8 @@ function break_projection() parent_name=$2 break_type=$3 - read -r disk_name part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT disk_name, path + read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT path FROM system.projection_parts WHERE table='test' AND database=currentDatabase() From a57e612cf2ef657801cdeefb8410caf5cab804a2 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 24 Nov 2023 16:08:49 +0100 Subject: [PATCH 007/245] Fxi tests --- src/Storages/StorageMergeTree.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 74277616e95..84b48bb650b 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2247,7 +2247,7 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { try { - auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); + auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */true); calculated_checksums.checkEqual(part->checksums, true); auto & part_mutable = const_cast(*part); @@ -2268,7 +2268,7 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { try { - checkDataPart(part, true, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); + checkDataPart(part, true, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */true); return CheckResult(part->name, true, ""); } catch (...) 
From 8ebbc8d85dc3f1e37d109ddb1ad1a05a55283a79 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 24 Nov 2023 18:37:40 +0100 Subject: [PATCH 008/245] Update 02117_show_create_table_system.reference --- .../0_stateless/02117_show_create_table_system.reference | 3 +++ 1 file changed, 3 insertions(+) diff --git a/tests/queries/0_stateless/02117_show_create_table_system.reference b/tests/queries/0_stateless/02117_show_create_table_system.reference index 9ed905a0df8..e122de8ef6c 100644 --- a/tests/queries/0_stateless/02117_show_create_table_system.reference +++ b/tests/queries/0_stateless/02117_show_create_table_system.reference @@ -685,6 +685,9 @@ CREATE TABLE system.projection_parts `rows_where_ttl_info.expression` Array(String), `rows_where_ttl_info.min` Array(DateTime), `rows_where_ttl_info.max` Array(DateTime), + `is_broken` UInt8, + `exception_code` Int32, + `exception` String, `bytes` UInt64 ALIAS bytes_on_disk, `marks_size` UInt64 ALIAS marks_bytes, `part_name` String ALIAS name From b4dab194954845b76d1ce9a6bf8b18dded059d74 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 27 Nov 2023 12:42:09 +0100 Subject: [PATCH 009/245] Fix test --- .../0_stateless/02916_broken_projection.reference | 1 + tests/queries/0_stateless/02916_broken_projection.sh | 12 +++++++++--- 2 files changed, 10 insertions(+), 3 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 1b84ca96840..1f072e207a7 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -55,6 +55,7 @@ select from projection 'proj', expect error: proj_2 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: proj_2 +FILE_DOESNT_EXIST check table 0 broken projections info diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 6ed92e2e06e..80805330577 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -115,7 +115,10 @@ function check() if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " +SET send_logs_level='fatal'; +SELECT c FROM test WHERE d == 12 ORDER BY c; +" 2>&1 | grep -oF "$expected_error" else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' @@ -130,7 +133,10 @@ function check() if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " +SET send_logs_level='fatal'; +SELECT d FROM test WHERE c == 12 ORDER BY d; +" 2>&1 | grep -oF "$expected_error" else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' @@ -234,7 +240,7 @@ break_projection proj_2 all_2_2_0 data broken_projections_info # Select now fails with error "File doesn't exist" -check "proj_2" 
"FILE_DOESNT_EXIST" +check "proj_2" FILE_DOESNT_EXIST # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. broken_projections_info From a6972e7c90fd8ff775855cac13f47f9cd46b2da1 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 28 Nov 2023 10:22:10 +0100 Subject: [PATCH 010/245] Fxi --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 85ce112d9a1..be665a64f1c 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1145,7 +1145,7 @@ void IMergeTreeDataPart::loadChecksums(bool require) LOG_WARNING(storage.log, "Checksums for part {} not found. Will calculate them from data on disk.", name); bool noop; - checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */false); + checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */false); writeChecksums(checksums, {}); bytes_on_disk = checksums.getTotalSizeOnDisk(); From 0e11eeaea546dd41231a4f180b877ada1291a23d Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 30 Nov 2023 13:52:08 +0100 Subject: [PATCH 011/245] Allow to backup and restore parts with broken projections --- src/Backups/BackupSettings.cpp | 2 + src/Backups/BackupSettings.h | 6 + .../MergeTree/DataPartStorageOnDiskBase.cpp | 35 +- .../MergeTree/DataPartStorageOnDiskBase.h | 4 +- src/Storages/MergeTree/IDataPartStorage.h | 4 +- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 15 +- src/Storages/MergeTree/IMergeTreeDataPart.h | 3 +- src/Storages/MergeTree/MergeTreeData.cpp | 9 +- .../02916_broken_projection.reference | 226 +++++++++- .../0_stateless/02916_broken_projection.sh | 426 +++++++++++++----- 10 files changed, 588 insertions(+), 142 deletions(-) diff --git a/src/Backups/BackupSettings.cpp b/src/Backups/BackupSettings.cpp index 68d825e9468..51d713f03e1 100644 --- a/src/Backups/BackupSettings.cpp +++ b/src/Backups/BackupSettings.cpp @@ -32,6 +32,8 @@ namespace ErrorCodes M(UInt64, shard_num) \ M(UInt64, replica_num) \ M(Bool, check_parts) \ + M(Bool, check_projection_parts) \ + M(Bool, allow_backup_broken_projections) \ M(Bool, internal) \ M(String, host_id) \ M(OptionalUUID, backup_uuid) diff --git a/src/Backups/BackupSettings.h b/src/Backups/BackupSettings.h index f26b992b348..ec430905f51 100644 --- a/src/Backups/BackupSettings.h +++ b/src/Backups/BackupSettings.h @@ -62,6 +62,12 @@ struct BackupSettings /// Check checksums of the data parts before writing them to a backup. bool check_parts = true; + /// Check checksums of the projection data parts before writing them to a backup. + bool check_projection_parts = true; + + /// Allow to create backup with broken projections. + bool allow_backup_broken_projections = false; + /// Internal, should not be specified by user. /// Whether this backup is a part of a distributed backup created by BACKUP ON CLUSTER. 
bool internal = false; diff --git a/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp b/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp index 7fc8187aee5..6e5cbdde355 100644 --- a/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp +++ b/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp @@ -334,7 +334,9 @@ void DataPartStorageOnDiskBase::backup( const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const { fs::path part_path_on_disk = fs::path{root_path} / part_dir; fs::path part_path_in_backup = fs::path{path_in_backup} / part_dir; @@ -376,7 +378,7 @@ void DataPartStorageOnDiskBase::backup( bool copy_encrypted = !backup_settings.decrypt_files_from_encrypted_disks; - for (const auto & filepath : files_to_backup) + auto backup_file = [&](const String & filepath) { auto filepath_on_disk = part_path_on_disk / filepath; auto filepath_in_backup = part_path_in_backup / filepath; @@ -384,8 +386,10 @@ void DataPartStorageOnDiskBase::backup( if (files_without_checksums.contains(filepath)) { backup_entries.emplace_back(filepath_in_backup, std::make_unique(disk, filepath_on_disk, read_settings, copy_encrypted)); - continue; + return; } + else if (is_projection_part && allow_backup_broken_projection && !disk->exists(filepath_on_disk)) + return; if (make_temporary_hard_links) { @@ -410,6 +414,31 @@ void DataPartStorageOnDiskBase::backup( backup_entry = wrapBackupEntryWith(std::move(backup_entry), temp_dir_owner); backup_entries.emplace_back(filepath_in_backup, std::move(backup_entry)); + }; + + auto * log = &Poco::Logger::get("DataPartStorageOnDiskBase::backup"); + + for (const auto & filepath : files_to_backup) + { + if (is_projection_part && allow_backup_broken_projection) + { + try + { + backup_file(filepath); + } + catch (Exception & e) + { + if (e.code() != ErrorCodes::FILE_DOESNT_EXIST) + throw; + + LOG_ERROR(log, "Cannot backup file {} of projection part {}. Will try to ignore it", filepath, part_dir); + continue; + } + } + else + { + backup_file(filepath); + } } } diff --git a/src/Storages/MergeTree/DataPartStorageOnDiskBase.h b/src/Storages/MergeTree/DataPartStorageOnDiskBase.h index 1826e84c28d..6176a13c27b 100644 --- a/src/Storages/MergeTree/DataPartStorageOnDiskBase.h +++ b/src/Storages/MergeTree/DataPartStorageOnDiskBase.h @@ -58,7 +58,9 @@ public: const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const override; + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const override; MutableDataPartStoragePtr freeze( const std::string & to, diff --git a/src/Storages/MergeTree/IDataPartStorage.h b/src/Storages/MergeTree/IDataPartStorage.h index 072cb29626e..b3a6ab203d5 100644 --- a/src/Storages/MergeTree/IDataPartStorage.h +++ b/src/Storages/MergeTree/IDataPartStorage.h @@ -222,7 +222,9 @@ public: const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const = 0; + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const = 0; /// Creates hardlinks into 'to/dir_path' for every file in data part. /// Callback is called after hardlinks are created, but before 'delete-on-destroy.txt' marker is removed. 
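Before the loading-side changes below, the control flow of the new backup_file wrapper in DataPartStorageOnDiskBase::backup is worth spelling out: a missing file is tolerated only when the part being backed up is a projection part and allow_backup_broken_projections was set; for ordinary parts the exception still propagates. A simplified sketch of that logic, where the types and names are illustrative stand-ins rather than the real storage interface:

    #include <iostream>
    #include <stdexcept>
    #include <string>
    #include <utility>
    #include <vector>

    struct FileDoesntExist : std::runtime_error
    {
        using std::runtime_error::runtime_error;
    };

    // Illustrative stand-in for backing up a single file of a part.
    void backupOneFile(const std::string & path, bool exists)
    {
        if (!exists)
            throw FileDoesntExist("No such file: " + path);
        std::cout << "backed up " << path << '\n';
    }

    void backupPart(const std::vector<std::pair<std::string, bool>> & files,
                    bool is_projection_part, bool allow_backup_broken_projection)
    {
        for (const auto & [path, exists] : files)
        {
            if (is_projection_part && allow_backup_broken_projection)
            {
                try
                {
                    backupOneFile(path, exists);
                }
                catch (const FileDoesntExist &)
                {
                    continue;  // data files lost together with a broken projection are skipped
                }
            }
            else
            {
                backupOneFile(path, exists);  // for normal parts a missing file stays a hard error
            }
        }
    }

    int main()
    {
        // 'c.bin' was deleted when the projection broke; the backup still succeeds.
        backupPart({{"c.bin", false}, {"d.bin", true}}, true, true);
        return 0;
    }

The asymmetry is deliberate: skipping missing files of a healthy part would silently produce an incomplete backup.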
diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index be665a64f1c..940b3991067 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -647,13 +647,14 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks loadIndex(); /// Must be called after loadIndexGranularity as it uses the value of `index_granularity` loadRowsCount(); /// Must be called after loadIndexGranularity() as it uses the value of `index_granularity`. loadPartitionAndMinMaxIndex(); + bool has_broken_projections = false; if (!parent_part) { loadTTLInfos(); - loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */); + has_broken_projections = !loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */); } - if (check_consistency) + if (check_consistency && !has_broken_projections) checkConsistency(require_columns_checksums); loadDefaultCompressionCodec(); @@ -715,9 +716,10 @@ void IMergeTreeDataPart::addProjectionPart( projection_parts[projection_name] = std::move(projection_part); } -void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded) +bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded) { auto metadata_snapshot = storage.getInMemoryMetadataPtr(); + bool has_broken_projection = false; for (const auto & projection : metadata_snapshot->projections) { auto path = projection.name + ".proj"; @@ -742,16 +744,19 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch if (isRetryableException(std::current_exception())) throw; + auto message = getCurrentExceptionMessage(true); LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"), - "Cannot load projection {}, will consider it broken", projection.name); + "Cannot load projection {}, will consider it broken. Reason: {}", projection.name, message); - part->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); + has_broken_projection = true; + part->setBrokenReason(message, getCurrentExceptionCode()); } addProjectionPart(projection.name, std::move(part)); } } } + return has_broken_projection; } void IMergeTreeDataPart::loadIndexGranularity() diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 9af2c16f1e8..6e276284f4c 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -421,7 +421,8 @@ public: bool hasBrokenProjection(const String & projection_name) const; - void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); + /// Return true, if all projections were loaded successfully and none was marked as broken. 
+ bool loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); void setBrokenReason(const String & message, int code) const; diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 8683e4293e9..c95aee88aee 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -5113,7 +5113,7 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( if (hold_table_lock && !table_lock) table_lock = lockForShare(local_context->getCurrentQueryId(), local_context->getSettingsRef().lock_acquire_timeout); - if (backup_settings.check_parts) + if (backup_settings.check_projection_parts) part->checkConsistencyWithProjections(/* require_part_metadata= */ true); BackupEntries backup_entries_from_part; @@ -5125,7 +5125,8 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( read_settings, make_temporary_hard_links, backup_entries_from_part, - &temp_dirs); + &temp_dirs, + false, false); auto projection_parts = part->getProjectionParts(); for (const auto & [projection_name, projection_part] : projection_parts) @@ -5138,7 +5139,9 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( read_settings, make_temporary_hard_links, backup_entries_from_part, - &temp_dirs); + &temp_dirs, + projection_part->is_broken, + backup_settings.allow_backup_broken_projections); } if (hold_storage_and_part_ptrs) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 1f072e207a7..4c4901ae99f 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -19,6 +19,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 +0 broke metadata of part 'proj' (parent part: all_2_2_0) system.parts all_0_0_0 1 ['proj','proj_2'] @@ -39,8 +40,9 @@ check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -check table full (all_2_2_0) +check table full (test - all_2_2_0) all_2_2_0 +0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -78,6 +80,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 +0 broke data of part 'proj_2' (parent part: all_3_3_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -111,6 +114,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 +0 broke metadata of part 'proj' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -118,6 +122,7 @@ all_1_1_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST +0 broke data of part 'proj_2' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -146,10 +151,10 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 -check table full (all_1_1_0) +check table full (test - all_1_1_0) all_1_1_0 materialize projection proj -check table full () +check table full (test - ) system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] @@ -175,7 +180,8 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 materialize projection proj_2 -check table full () +check table full (test - ) +0 broke data of part 'proj' (parent part: all_3_5_1_7) insert new part optimize @@ -214,3 
+220,215 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +system.parts +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke data of part 'proj' (parent part: all_0_0_0) +check table full (test2 - all_0_0_0) +all_0_0_0 +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broke data of part 'all_0_0_0' +check table full (test2 - all_0_0_0) +all_0_0_0 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke data of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +FILE_DOESNT_EXIST +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +FILE_DOESNT_EXIST +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +0 +broke all data of part 
'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +FILE_DOESNT_EXIST +materialize projection proj +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_4 1 ['proj','proj_2'] +all_1_1_0 0 ['proj','proj_2'] +all_1_1_0_4 1 ['proj','proj_2'] +all_2_2_0 0 ['proj','proj_2'] +all_2_2_0_4 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] +all_3_3_0_4 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke all data of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 80805330577..1555139e16f 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -5,35 +5,40 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh . 
"$CURDIR"/../shell_config.sh -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE IF EXISTS test SYNC; -CREATE TABLE test -( - a String, - b String, - c Int32, - d Int32, - e Int32, +function create_table() +{ + test_id=$1 + name=$2 + replica=$3 + $CLICKHOUSE_CLIENT -nm -q " + DROP TABLE IF EXISTS $name SYNC; + CREATE TABLE $name + ( + a String, + b String, + c Int64, + d Int64, + e Int64, - PROJECTION proj - ( - SELECT c ORDER BY d - ), - PROJECTION proj_2 - ( - SELECT d ORDER BY c + PROJECTION proj + ( + SELECT c ORDER BY d + ), + PROJECTION proj_2 + ( + SELECT d ORDER BY c + ) ) -) -ENGINE = ReplicatedMergeTree('/test4/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) -SETTINGS min_bytes_for_wide_part = 0, - max_parts_to_merge_at_once=3, - enable_vertical_merge_algorithm=1, - vertical_merge_algorithm_min_rows_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1; -" - -table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") + ENGINE = ReplicatedMergeTree('/test_broken_projection_24_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + SETTINGS min_bytes_for_wide_part = 0, + max_parts_to_merge_at_once=3, + enable_vertical_merge_algorithm=1, + vertical_merge_algorithm_min_rows_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + compress_primary_key=0; + " +} function random() { @@ -42,49 +47,88 @@ function random() function insert() { - offset=$1 - size=$2 + table=$1 + offset=$2 + size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO test SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" } function break_projection() { - part_name=$1 - parent_name=$2 - break_type=$3 + table=$1 + part_name=$2 + parent_name=$3 + break_type=$4 read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " SELECT path FROM system.projection_parts - WHERE table='test' + WHERE table='$table' AND database=currentDatabase() AND active=1 AND part_name='$part_name' AND parent_name='$parent_name' + ORDER BY modification_time DESC LIMIT 1; ") + $CLICKHOUSE_CLIENT -q "select throwIf(substring('$part_path', 1, 1) != '/', 'Path is relative: $part_path')" || exit + if [ "$break_type" = "data" ] then rm "$part_path/d.bin" rm "$part_path/c.bin" echo "broke data of part '$part_name' (parent part: $parent_name)" - else + fi + if [ "$break_type" = "metadata" ] + then rm "$part_path/columns.txt" echo "broke metadata of part '$part_name' (parent part: $parent_name)" fi + if [ "$break_type" = "part" ] + then + rm -r "$part_path" + echo "broke all data of part '$part_name' (parent part: $parent_name)" + fi +} + +function break_part() +{ + table=$1 + part_name=$2 + + read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT path + FROM system.parts + WHERE table='$table' + AND database=currentDatabase() + AND active=1 + AND part_name='$part_name' + ORDER BY modification_time DESC + LIMIT 1; + ") + + if [ "$part_path" = "" ] + then + echo "Part path is empty" + exit + fi + + rm $part_path/columns.txt + echo "broke data of part '$part_name'" } function broken_projections_info() { + table=$1 echo 'broken projections info' $CLICKHOUSE_CLIENT -q " SELECT parent_name, name, errors.name FROM ( SELECT parent_name, name, exception_code FROM 
system.projection_parts - WHERE table='test' + WHERE table='$table' AND database=currentDatabase() AND is_broken = 1 ) AS parts_info @@ -96,18 +140,19 @@ function broken_projections_info() function check() { + table=$1 expect_broken_part="" expected_error="" - if [ $# -ne 0 ]; then - expect_broken_part=$1 - expected_error=$2 + if [ $# -gt 1 ]; then + expect_broken_part=$2 + expected_error=$3 fi echo 'system.parts' $CLICKHOUSE_CLIENT -q " SELECT name, active, projections FROM system.parts - WHERE table='test' AND database=currentDatabase() + WHERE table='$table' AND database=currentDatabase() ORDER BY name;" echo "select from projection 'proj', expect error: $expect_broken_part" @@ -117,10 +162,10 @@ function check() then $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " SET send_logs_level='fatal'; -SELECT c FROM test WHERE d == 12 ORDER BY c; +SELECT c FROM $table WHERE d == 12 ORDER BY c; " 2>&1 | grep -oF "$expected_error" else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -135,10 +180,10 @@ SELECT c FROM test WHERE d == 12 ORDER BY c; then $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " SET send_logs_level='fatal'; -SELECT d FROM test WHERE c == 12 ORDER BY d; +SELECT d FROM $table WHERE c == 12 ORDER BY d; " 2>&1 | grep -oF "$expected_error" else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -149,7 +194,7 @@ SELECT d FROM test WHERE c == 12 ORDER BY d; echo 'check table' $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test;" + CHECK TABLE $table;" } function optimize() @@ -184,141 +229,274 @@ function reattach() function materialize_projection { - projection=$1 + table=$1 + projection=$2 echo "materialize projection $projection" - $CLICKHOUSE_CLIENT -q "ALTER TABLE test MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" + $CLICKHOUSE_CLIENT -q "ALTER TABLE $table MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" } function check_table_full() { - echo "check table full ($1)" - expect_broken_part=$1 + table=$1 + expect_broken_part=$2 + echo "check table full ($1 - $2)" if [ "$expect_broken_part" = "" ] then $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; + CHECK TABLE $table SETTINGS check_query_single_value_result = 0; " | grep "broken" else $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; + CHECK TABLE $table SETTINGS check_query_single_value_result = 0; " | grep "broken" | grep -o $expect_broken_part | head -n 1 fi } +function test1() +{ + create_table test1 test 1 -insert 0 5 + table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") -insert 5 5 + insert test 0 5 -insert 10 5 + insert test 5 5 -insert 15 5 + insert test 10 5 -check + insert test 15 5 -# Break metadata file of projection 'proj' 
-break_projection proj all_2_2_0 metadata

-# Do select and after "check table" query.
-# Select works because it does not read columns.txt.
-check
+    check test

-# Projection 'proj' from part all_2_2_0 will now appear in broken parts info
-# because it was marked broken during "check table" query.
-# TODO: try to mark it during select as well
-broken_projections_info
+    # Break metadata file of projection 'proj'
+    break_projection test proj all_2_2_0 metadata

-# Check table query will also show a list of parts which have broken projections.
-check_table_full "all_2_2_0"
+    # Do select and after "check table" query.
+    # Select works because it does not read columns.txt.
+    check test

-# Break data file of projection 'proj_2' for part all_2_2_0
-break_projection proj_2 all_2_2_0 data
+    # Projection 'proj' from part all_2_2_0 will now appear in broken parts info
+    # because it was marked broken during "check table" query.
+    # TODO: try to mark it during select as well
+    broken_projections_info test

-# It will not yet appear in broken projections info.
-broken_projections_info
+    # Check table query will also show a list of parts which have broken projections.
+    check_table_full test "all_2_2_0"

-# Select now fails with error "File doesn't exist"
-check "proj_2" FILE_DOESNT_EXIST
+    # Break data file of projection 'proj_2' for part all_2_2_0
+    break_projection test proj_2 all_2_2_0 data

-# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info.
-broken_projections_info
+    # It will not yet appear in broken projections info.
+    broken_projections_info test

-# Second select works, because projection is now marked as broken.
-check
+    # Select now fails with error "File doesn't exist"
+    check test "proj_2" FILE_DOESNT_EXIST

-# Break data file of projection 'proj_2' for part all_3_3_0
-break_projection proj_2 all_3_3_0 data
+    # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info.
+    broken_projections_info test

-# It will not yet appear in broken projections info.
-broken_projections_info
+    # Second select works, because projection is now marked as broken.
+    check test

-insert 20 5
+    # Break data file of projection 'proj_2' for part all_3_3_0
+    break_projection test proj_2 all_3_3_0 data

-insert 25 5
+    # It will not yet appear in broken projections info.
+    broken_projections_info test

-# Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet.
-# Parts all_4_4_0 and all_5_5_0 have both non-broken projections.
-# So a merge will be create for future part all_3_5_1.
-# During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken.
-# Merge will be retried and on second attempt it will succeed.
-# The result part all_3_5_1 will have only 1 projection - 'proj', because
-# it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections.
-optimize 0 1
-sleep 2
+    insert test 20 5

-$CLICKHOUSE_CLIENT -nm -q "
-SYSTEM FLUSH LOGS;
-SELECT count() FROM system.text_log
-WHERE level='Error'
-AND logger_name='MergeTreeBackgroundExecutor'
-AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%'
-"
+    insert test 25 5

-# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info.
-broken_projections_info
+    # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet.
+    # Parts all_4_4_0 and all_5_5_0 have both non-broken projections.
+    # So a merge will be created for future part all_3_5_1.
+ # During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. + # Merge will be retried and on second attempt it will succeed. + # The result part all_3_5_1 will have only 1 projection - 'proj', because + # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. + optimize 0 1 + sleep 2 -# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. -broken_projections_info + $CLICKHOUSE_CLIENT -nm -q " + SYSTEM FLUSH LOGS; + SELECT count() FROM system.text_log + WHERE level='Error' + AND logger_name='MergeTreeBackgroundExecutor' + AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' + " -check + # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. + broken_projections_info test -break_projection proj all_1_1_0 metadata + check test -reattach + break_projection test proj all_1_1_0 metadata -broken_projections_info + reattach -break_projection proj_2 all_1_1_0 data + broken_projections_info test -reattach + break_projection test proj_2 all_1_1_0 data -broken_projections_info + reattach -check + broken_projections_info test -check_table_full all_1_1_0 + check test -materialize_projection proj + check_table_full test all_1_1_0 -check_table_full + materialize_projection test proj -check + check_table_full test -materialize_projection proj_2 + check test -check_table_full + materialize_projection test proj_2 -break_projection proj all_3_5_1_7 data + check_table_full test -insert 30 5 + break_projection test proj all_3_5_1_7 data -optimize 1 0 + insert test 30 5 -insert 35 5 + optimize 1 0 -optimize 1 0 + insert test 35 5 -check + optimize 1 0 -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE test SYNC; -" + check test +} + +function test2() +{ + create_table test2 test2 1 + + insert test2 0 5 + + insert test2 5 5 + + insert test 10 5 + + insert test 15 5 + + check test2 + + create_table test2 test2_replica 2 + + check test2_replica + + break_projection test2 proj all_0_0_0 data + + check_table_full test2 all_0_0_0 + + check test2 + + break_part test2 all_0_0_0 + + check_table_full test2 all_0_0_0 + + check test2 + + $CLICKHOUSE_CLIENT -q "SYSTEM SYNC REPLICA test2;" + + check test2 +} + +CLICKHOUSE_TEST_UNIQUE_NAME="gghhhhhhhhhhhhhhhhhhh" +function test3() +{ + create_table test3 test 1 + + insert test 0 5 + + insert test 5 5 + + insert test 10 5 + + insert test 15 5 + + check test + + break_projection test proj all_2_2_0 data + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); + " | grep -o "RESTORED" + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + break_projection test proj all_2_2_0 part + + check test proj + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + " 2>&1 | grep -o "FILE_DOESNT_EXIST" + + materialize_projection test proj + + check test proj + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup 
table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); + " | grep -o "RESTORED" + + check test proj + + break_projection test proj all_2_2_0 part + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + settings check_projection_parts=false, allow_backup_broken_projections=true; + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); + " | grep -o "RESTORED" + + check test + + broken_projections_info test +} + +test1 +test2 +test3 + + +#$CLICKHOUSE_CLIENT -nm -q " +#DROP TABLE test SYNC; +#DROP TABLE test2 SYNC; +#DROP TABLE test2_replica SYNC; +#" From 6632589d72ed270626e012c86a78a8f0c8411fb3 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 30 Nov 2023 13:54:22 +0100 Subject: [PATCH 012/245] Review fix --- src/Storages/MergeTree/MergeTreeData.cpp | 6 +++--- tests/queries/0_stateless/02916_broken_projection.sh | 10 +++++----- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index c95aee88aee..1ba4153bc3e 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7669,7 +7669,7 @@ MovePartsOutcome MergeTreeData::moveParts(const CurrentlyMovingPartsTaggerPtr & bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const DataPartPtr & right, String & out_reason) { - auto remove_broken_parts = [](auto & parts) + auto remove_broken_parts_from_consideration = [](auto & parts) { std::set broken_projection_parts; for (const auto & [name, part] : parts) @@ -7684,8 +7684,8 @@ bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const auto left_projection_parts = left->getProjectionParts(); auto right_projection_parts = right->getProjectionParts(); - remove_broken_parts(left_projection_parts); - remove_broken_parts(right_projection_parts); + remove_broken_parts_from_consideration(left_projection_parts); + remove_broken_parts_from_consideration(right_projection_parts); if (left_projection_parts.size() != right_projection_parts.size()) { diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 1555139e16f..60b21216d1a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -495,8 +495,8 @@ test2 test3 -#$CLICKHOUSE_CLIENT -nm -q " -#DROP TABLE test SYNC; -#DROP TABLE test2 SYNC; -#DROP TABLE test2_replica SYNC; -#" +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE IF EXISTS test SYNC; +DROP TABLE IF EXISTS test2 SYNC; +DROP TABLE IF EXISTS test2_replica SYNC; +" From caf4dc7e14e594da3c254822b345b79c57e76d19 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 1 Dec 2023 12:21:47 +0100 Subject: [PATCH 013/245] Fix style check --- src/Common/ErrorCodes.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/ErrorCodes.cpp b/src/Common/ErrorCodes.cpp index b0ed754536d..57aa82f3639 
100644 --- a/src/Common/ErrorCodes.cpp +++ b/src/Common/ErrorCodes.cpp @@ -587,7 +587,7 @@ M(705, TABLE_NOT_EMPTY) \ M(706, LIBSSH_ERROR) \ M(707, GCP_ERROR) \ - M(708, ILLEGAL_STATISTIC) \ + M(708, ILLEGAL_STATISTIC) \ M(709, BROKEN_PROJECTION) \ \ M(999, KEEPER_EXCEPTION) \ From f609c44eb83fc769ba9e8fc5875bbc10e3e17b9b Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 1 Dec 2023 13:38:28 +0100 Subject: [PATCH 014/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 60b21216d1a..bd141d1a122 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -459,11 +459,13 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set send_logs_level='fatal'; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); " | grep -o "RESTORED" @@ -476,12 +478,14 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set send_logs_level='fatal'; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); " | grep -o "RESTORED" From 2b903003b4795eb3768fec3f84ec8321fa5485f6 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 4 Dec 2023 13:21:18 +0100 Subject: [PATCH 015/245] Update reference --- .../0_stateless/02916_broken_projection.reference | 8 +++----- tests/queries/0_stateless/02916_broken_projection.sh | 9 ++++----- 2 files changed, 7 insertions(+), 10 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 4c4901ae99f..acd1b87eb30 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -332,16 +332,14 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -FILE_DOESNT_EXIST select from projection 'proj_2', expect error: proj 12 16 used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table -0 +1 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART 0 broke all data of part 'proj' (parent part: all_2_2_0) system.parts @@ -358,7 +356,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj FILE_DOESNT_EXIST FILE_DOESNT_EXIST materialize projection proj system.parts @@ -379,7 +377,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED system.parts diff --git 
a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index bd141d1a122..7315cf5ce61 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -29,7 +29,7 @@ function create_table() SELECT d ORDER BY c ) ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_24_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + ENGINE = ReplicatedMergeTree('/test_broken_projection_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -407,7 +407,6 @@ function test2() check test2 } -CLICKHOUSE_TEST_UNIQUE_NAME="gghhhhhhhhhhhhhhhhhhh" function test3() { create_table test3 test 1 @@ -437,7 +436,7 @@ function test3() restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" - check test proj FILE_DOESNT_EXIST + check test proj broken_projections_info test @@ -479,14 +478,14 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); " | grep -o "RESTORED" check test From b77a6073aea98c7c5f5fcc28492a34e801d11b6b Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 4 Dec 2023 16:57:09 +0100 Subject: [PATCH 016/245] Fix test --- .../02916_broken_projection.reference | 90 +++++++++++-------- .../0_stateless/02916_broken_projection.sh | 36 ++++---- 2 files changed, 70 insertions(+), 56 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index acd1b87eb30..b7764a6434e 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -7,12 +7,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -26,12 +26,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -51,7 +51,7 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj_2 +select from projection 'proj' 12 16 used projections @@ -68,12 +68,12 @@ all_0_0_0 1 
['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -102,12 +102,12 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -139,12 +139,12 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -167,12 +167,12 @@ all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -208,12 +208,12 @@ all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] all_8_8_0 0 ['proj','proj_2'] all_9_9_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -227,20 +227,19 @@ insert new part system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 system.parts -all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -252,10 +251,10 @@ all_0_0_0 system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -266,10 +265,10 @@ all_0_0_0 system.parts all_0_0_0 0 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select 
from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -277,10 +276,10 @@ check table system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -294,12 +293,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -315,7 +314,7 @@ all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj FILE_DOESNT_EXIST -select from projection 'proj_2', expect error: proj +select from projection 'proj_2' 12 16 used projections @@ -331,8 +330,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -348,7 +351,8 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +STD_EXCEPTION +select from projection 'proj_2' 12 16 used projections @@ -368,8 +372,12 @@ all_2_2_0 0 ['proj','proj_2'] all_2_2_0_4 1 ['proj','proj_2'] all_3_3_0 0 ['proj','proj_2'] all_3_3_0_4 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -385,8 +393,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -401,7 +413,7 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj_2' 12 16 used projections @@ -417,12 +429,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections diff --git a/tests/queries/0_stateless/02916_broken_projection.sh 
b/tests/queries/0_stateless/02916_broken_projection.sh index 7315cf5ce61..eeea512f14a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -29,7 +29,7 @@ function create_table() SELECT d ORDER BY c ) ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + ENGINE = ReplicatedMergeTree('/test_broken_projection_32_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -155,39 +155,41 @@ function check() WHERE table='$table' AND database=currentDatabase() ORDER BY name;" - echo "select from projection 'proj', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj" ] then + echo "select from projection 'proj', expect error: $expect_broken_part" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " -SET send_logs_level='fatal'; -SELECT c FROM $table WHERE d == 12 ORDER BY c; -" 2>&1 | grep -oF "$expected_error" + SET send_logs_level='fatal'; + SELECT c FROM $table WHERE d == 12 ORDER BY c; + " 2>&1 | grep -oF "$expected_error" else + echo "select from projection 'proj'" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SYSTEM FLUSH LOGS; + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi - echo "select from projection 'proj_2', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj_2" ] then + echo "select from projection 'proj_2', expect error: $expect_broken_part" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " -SET send_logs_level='fatal'; -SELECT d FROM $table WHERE c == 12 ORDER BY d; -" 2>&1 | grep -oF "$expected_error" + SET send_logs_level='fatal'; + SELECT d FROM $table WHERE c == 12 ORDER BY d; + " 2>&1 | grep -oF "$expected_error" else + echo "select from projection 'proj_2'" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SYSTEM FLUSH LOGS; + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -436,13 +438,13 @@ function test3() restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" - check test proj + check test broken_projections_info test break_projection test proj all_2_2_0 part - check test proj + check test proj STD_EXCEPTION broken_projections_info test @@ -453,7 +455,7 @@ function test3() materialize_projection test proj - check test proj + check test broken_projections_info test @@ -468,7 +470,7 @@ function test3() restore table 
${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3');
     " | grep -o "RESTORED"

-    check test proj
+    check test

     break_projection test proj all_2_2_0 part

From 4de048904a3cbb6ff30e20b5a8defd1564f2e722 Mon Sep 17 00:00:00 2001
From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com>
Date: Mon, 4 Dec 2023 19:14:06 +0100
Subject: [PATCH 017/245] Update 02916_broken_projection.sh

---
 tests/queries/0_stateless/02916_broken_projection.sh | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh
index eeea512f14a..261342da103 100755
--- a/tests/queries/0_stateless/02916_broken_projection.sh
+++ b/tests/queries/0_stateless/02916_broken_projection.sh
@@ -1,4 +1,5 @@
 #!/usr/bin/env bash
+# Tags: no-random-merge-tree-settings
 # shellcheck disable=SC2046

 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

From d3b80ac60cdb1fa17fb8907a7a6f11afde759bab Mon Sep 17 00:00:00 2001
From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com>
Date: Mon, 4 Dec 2023 19:14:55 +0100
Subject: [PATCH 018/245] Update 02916_broken_projection.sh

---
 tests/queries/0_stateless/02916_broken_projection.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh
index 261342da103..0910ba177fb 100755
--- a/tests/queries/0_stateless/02916_broken_projection.sh
+++ b/tests/queries/0_stateless/02916_broken_projection.sh
@@ -1,5 +1,5 @@
 #!/usr/bin/env bash
-# Tags: no-random-merge-tree-settings
+# Tags: long, no-random-merge-tree-settings
 # shellcheck disable=SC2046

 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

From 23bde28ac4fc18e296daf6b04283ab50ee58d025 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Fri, 8 Dec 2023 19:11:47 +0100
Subject: [PATCH 019/245] Fix

---
 src/Storages/MergeTree/IMergeTreeDataPart.cpp | 6 ++----
 src/Storages/MergeTree/IMergeTreeDataPart.h   | 2 +-
 src/Storages/MergeTree/MutateTask.cpp         | 6 ++++--
 3 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
index 52310802c9d..5418bcd83f3 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@@ -677,7 +677,7 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks
     if (!parent_part)
     {
         loadTTLInfos();
-        has_broken_projections = !loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */);
+        loadProjections(require_columns_checksums, check_consistency, has_broken_projections, false /* if_not_loaded */);
     }

     if (check_consistency && !has_broken_projections)
@@ -742,10 +742,9 @@ void IMergeTreeDataPart::addProjectionPart(
     projection_parts[projection_name] = std::move(projection_part);
 }

-bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded)
+void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool & has_broken_projection, bool if_not_loaded)
 {
     auto metadata_snapshot = storage.getInMemoryMetadataPtr();
-    bool has_broken_projection = false;
     for (const auto & projection : metadata_snapshot->projections)
     {
         auto path = projection.name + ".proj";
@@ -782,7 +781,6 @@ bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch
         }
     }
-    return has_broken_projection;
 }

 void IMergeTreeDataPart::loadIndexGranularity()

diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h
index 050bd76121c..9812529086b 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.h
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.h
@@ -434,7 +434,7 @@ public:
     bool hasBrokenProjection(const String & projection_name) const;

-    /// Return true, if all projections were loaded successfully and none was marked as broken.
-    bool loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false);
+    /// Load projections and report broken ones through `has_broken_projection` instead of a return value.
+    void loadProjections(bool require_columns_checksums, bool check_consistency, bool & has_broken_projection, bool if_not_loaded = false);

     void setBrokenReason(const String & message, int code) const;

diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 93b241deae7..2b0cf60a7f1 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -870,7 +870,8 @@ void finalizeMutatedPart(
     new_data_part->modification_time = time(nullptr);

     /// Load rest projections which are hardlinked
-    new_data_part->loadProjections(false, false, true /* if_not_loaded */);
+    bool noop;
+    new_data_part->loadProjections(false, false, noop, true /* if_not_loaded */);

     /// All information about sizes is stored in checksums.
     /// It doesn't make sense to touch filesystem for sizes.
@@ -1570,8 +1571,9 @@ private:

     void finalize()
     {
+        bool noop;
         ctx->new_data_part->minmax_idx = std::move(ctx->minmax_idx);
-        ctx->new_data_part->loadProjections(false, false, true /* if_not_loaded */);
+        ctx->new_data_part->loadProjections(false, false, noop, true /* if_not_loaded */);

         ctx->mutating_executor.reset();
         ctx->mutating_pipeline.reset();

From c8c4db5984bf9101478e0d1f33c3432c257ea7a0 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Mon, 11 Dec 2023 13:24:31 +0100
Subject: [PATCH 020/245] Fix test

---
 src/Storages/MergeTree/IMergeTreeDataPart.cpp              | 7 +++++++
 .../queries/0_stateless/02916_broken_projection.reference  | 7 ++++---
 tests/queries/0_stateless/02916_broken_projection.sh       | 4 +++-
 3 files changed, 14 insertions(+), 4 deletions(-)

diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
index 5418bcd83f3..7af49edf788 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@@ -780,6 +780,13 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch
                 addProjectionPart(projection.name, std::move(part));
             }
         }
+        else if (checksums.has(path))
+        {
+            auto part = getProjectionPartBuilder(projection.name).withPartFormatFromDisk().build();
+            part->setBrokenReason("Projection directory " + path + " does not exist while loading projections", ErrorCodes::NO_FILE_IN_DATA_PART);
+            addProjectionPart(projection.name, std::move(part));
+            has_broken_projection = true;
+        }
     }
 }

diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference
index b7764a6434e..358304de74a 100644
--- a/tests/queries/0_stateless/02916_broken_projection.reference
+++ b/tests/queries/0_stateless/02916_broken_projection.reference
@@ -406,7 +406,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2
 check table
 1
 0
-broke all data of part 'proj' (parent part: all_2_2_0)
+broke all data of part 'proj' (parent part: all_1_1_0)
 system.parts
 all_0_0_0 1 ['proj','proj_2']
 all_1_1_0 1 ['proj','proj_2']
@@ -421,13 +421,13 @@ SELECT d
FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST +all_1_1_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj_2'] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 @@ -442,3 +442,4 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 0910ba177fb..eb68f8621a2 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -410,6 +410,8 @@ function test2() check test2 } +CLICKHOUSE_DATABASE="default" +CLICKHOUSE_TEST_UNIQUE_NAME="test123456" function test3() { create_table test3 test 1 @@ -473,7 +475,7 @@ function test3() check test - break_projection test proj all_2_2_0 part + break_projection test proj all_1_1_0 part check test proj FILE_DOESNT_EXIST From cd41802d7e5b056e0114c8ad7523f00828ad5940 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 11 Dec 2023 17:37:44 +0100 Subject: [PATCH 021/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 -- 1 file changed, 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index eb68f8621a2..a52570f3d52 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -410,8 +410,6 @@ function test2() check test2 } -CLICKHOUSE_DATABASE="default" -CLICKHOUSE_TEST_UNIQUE_NAME="test123456" function test3() { create_table test3 test 1 From 457032d2998a085fb9c10c0b9d536e79dbcc5dab Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Dec 2023 20:40:25 +0100 Subject: [PATCH 022/245] Disable fault injection because it breaks .reference --- tests/queries/0_stateless/02916_broken_projection.sh | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a52570f3d52..2049610e45b 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -52,7 +52,7 @@ function insert() offset=$2 size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability;" } function break_projection() @@ -431,11 +431,12 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false, backup_restore_keeper_fault_injection_probability=0.0; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set backup_restore_keeper_fault_injection_probability=0.0; restore table 
${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" @@ -451,6 +452,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') " 2>&1 | grep -o "FILE_DOESNT_EXIST" @@ -462,12 +464,14 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); " | grep -o "RESTORED" @@ -481,6 +485,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" @@ -488,6 +493,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); " | grep -o "RESTORED" From 8ef2638cfce90031213bbbd595a50d584406a916 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 12 Dec 2023 14:22:14 +0100 Subject: [PATCH 023/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 2049610e45b..0418759eb26 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -52,7 +52,7 @@ function insert() offset=$2 size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability;" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability=0.0;" } function break_projection() From d81edb4adf65c8c3724ec27fc83b65d5d1b3ebad Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 13 Dec 2023 12:29:28 +0100 Subject: [PATCH 024/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 0418759eb26..07495c45214 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -431,7 +431,8 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', 
'${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false, backup_restore_keeper_fault_injection_probability=0.0; + set backup_restore_keeper_fault_injection_probability=0.0; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " From 79432255df02f696962858347c2207dbdbf2b69f Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 18 Dec 2023 12:45:24 +0100 Subject: [PATCH 025/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 07495c45214..55e613b8f3a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings +# Tags: long, no-random-merge-tree-settings, no-random-settings # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From 319ae440b6ba09b1dc21b355fab22a99d073592c Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 16:43:30 +0000 Subject: [PATCH 026/245] Implement Variant data type --- docs/en/operations/settings/settings.md | 52 + docs/en/sql-reference/data-types/variant.md | 217 ++ .../functions/other-functions.md | 36 + src/Columns/ColumnNullable.cpp | 22 +- src/Columns/ColumnNullable.h | 1 + src/Columns/ColumnVariant.cpp | 1360 +++++++++ src/Columns/ColumnVariant.h | 306 ++ src/Columns/IColumn.cpp | 6 + src/Columns/IColumn.h | 14 + src/Columns/MaskOperations.cpp | 6 +- src/Columns/MaskOperations.h | 2 +- src/Columns/tests/gtest_column_variant.cpp | 688 +++++ src/Core/Settings.h | 2 + src/Core/TypeId.h | 1 + src/DataTypes/DataTypeFactory.cpp | 1 + src/DataTypes/DataTypeFactory.h | 1 + src/DataTypes/DataTypeNullable.cpp | 28 + src/DataTypes/DataTypeNullable.h | 3 + src/DataTypes/DataTypeTuple.cpp | 9 +- src/DataTypes/DataTypeVariant.cpp | 197 ++ src/DataTypes/DataTypeVariant.h | 64 + src/DataTypes/EnumValues.cpp | 21 + src/DataTypes/EnumValues.h | 8 +- src/DataTypes/IDataType.cpp | 23 +- src/DataTypes/IDataType.h | 3 + .../Serializations/ISerialization.cpp | 61 +- src/DataTypes/Serializations/ISerialization.h | 13 + .../Serializations/SerializationArray.cpp | 138 +- .../Serializations/SerializationArray.h | 3 + .../Serializations/SerializationBool.cpp | 179 +- .../Serializations/SerializationBool.h | 8 +- .../SerializationCustomSimpleText.cpp | 56 + .../SerializationCustomSimpleText.h | 6 + .../Serializations/SerializationDate.cpp | 46 + .../Serializations/SerializationDate.h | 5 + .../Serializations/SerializationDate32.cpp | 45 + .../Serializations/SerializationDate32.h | 5 + .../Serializations/SerializationDateTime.cpp | 157 +- .../Serializations/SerializationDateTime.h | 5 + .../SerializationDateTime64.cpp | 112 + .../Serializations/SerializationDateTime64.h | 6 + .../Serializations/SerializationDecimal.cpp | 46 +- .../Serializations/SerializationDecimal.h | 6 +- .../Serializations/SerializationEnum.cpp | 97 + .../Serializations/SerializationEnum.h | 13 + .../SerializationFixedString.cpp | 56 + .../Serializations/SerializationFixedString.h | 6 + .../SerializationIPv4andIPv6.cpp | 188 ++ .../Serializations/SerializationIPv4andIPv6.h | 129 +- 
.../SerializationLowCardinality.cpp | 47 +- .../SerializationLowCardinality.h | 12 + .../Serializations/SerializationMap.cpp | 108 +- .../Serializations/SerializationMap.h | 7 +- .../Serializations/SerializationNamed.cpp | 1 + .../Serializations/SerializationNothing.h | 1 + .../Serializations/SerializationNullable.cpp | 532 +++- .../Serializations/SerializationNullable.h | 53 +- .../Serializations/SerializationNumber.cpp | 80 +- .../Serializations/SerializationNumber.h | 3 + .../Serializations/SerializationString.cpp | 101 +- .../Serializations/SerializationString.h | 5 + .../Serializations/SerializationTuple.cpp | 318 ++- .../Serializations/SerializationTuple.h | 12 + .../Serializations/SerializationUUID.cpp | 41 +- .../Serializations/SerializationUUID.h | 6 +- .../Serializations/SerializationVariant.cpp | 828 ++++++ .../Serializations/SerializationVariant.h | 116 + .../SerializationVariantElement.cpp | 241 ++ .../SerializationVariantElement.h | 87 + .../Serializations/SerializationWrapper.cpp | 25 + .../Serializations/SerializationWrapper.h | 5 + .../Serializations/SimpleTextSerialization.h | 38 + src/DataTypes/Utils.cpp | 1 + src/Databases/DatabaseReplicated.cpp | 1 + src/Formats/EscapingRuleUtils.cpp | 10 +- src/Formats/JSONUtils.cpp | 4 +- src/Formats/SchemaInferenceUtils.cpp | 2 +- src/Functions/FunctionsConversion.h | 262 +- src/Functions/if.cpp | 50 +- src/Functions/isNotNull.cpp | 13 + src/Functions/isNull.cpp | 13 + src/Functions/multiIf.cpp | 10 + src/Functions/variantElement.cpp | 238 ++ src/IO/ReadHelpers.cpp | 298 +- src/IO/ReadHelpers.h | 198 +- src/IO/readDecimalText.h | 20 + src/Interpreters/InterpreterCreateQuery.cpp | 14 + src/Interpreters/InterpreterInsertQuery.cpp | 2 +- src/Interpreters/inplaceBlockConversions.cpp | 35 +- .../parseColumnsListForTableFunction.cpp | 11 + .../parseColumnsListForTableFunction.h | 2 + src/Parsers/ExpressionElementParsers.cpp | 2 +- .../Formats/Impl/CSVRowInputFormat.cpp | 2 +- .../Formats/Impl/MySQLDumpRowInputFormat.cpp | 2 +- .../Formats/Impl/TSKVRowInputFormat.cpp | 2 +- .../Impl/TabSeparatedRowInputFormat.cpp | 4 +- .../Formats/Impl/ValuesBlockInputFormat.cpp | 2 +- ...940_variant_text_deserialization.reference | 516 ++++ .../02940_variant_text_deserialization.sql | 266 ++ .../02941_variant_type_1.reference | 2472 +++++++++++++++++ .../0_stateless/02941_variant_type_1.sh | 124 + .../02941_variant_type_2.reference | 51 + .../0_stateless/02941_variant_type_2.sh | 71 + .../02941_variant_type_3.reference | 51 + .../0_stateless/02941_variant_type_3.sh | 71 + .../02941_variant_type_4.reference | 56 + .../0_stateless/02941_variant_type_4.sh | 66 + .../0_stateless/02942_variant_cast.reference | 25 + .../0_stateless/02942_variant_cast.sql | 23 + .../02943_variant_element.reference | 44 + .../0_stateless/02943_variant_element.sql | 16 + ...44_variant_as_if_multi_if_result.reference | 96 + .../02944_variant_as_if_multi_if_result.sql | 64 + 113 files changed, 11750 insertions(+), 584 deletions(-) create mode 100644 docs/en/sql-reference/data-types/variant.md create mode 100644 src/Columns/ColumnVariant.cpp create mode 100644 src/Columns/ColumnVariant.h create mode 100644 src/Columns/tests/gtest_column_variant.cpp create mode 100644 src/DataTypes/DataTypeVariant.cpp create mode 100644 src/DataTypes/DataTypeVariant.h create mode 100644 src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp create mode 100644 src/DataTypes/Serializations/SerializationVariant.cpp create mode 100644 src/DataTypes/Serializations/SerializationVariant.h create mode 
100644 src/DataTypes/Serializations/SerializationVariantElement.cpp
 create mode 100644 src/DataTypes/Serializations/SerializationVariantElement.h
 create mode 100644 src/Functions/variantElement.cpp
 create mode 100644 tests/queries/0_stateless/02940_variant_text_deserialization.reference
 create mode 100644 tests/queries/0_stateless/02940_variant_text_deserialization.sql
 create mode 100644 tests/queries/0_stateless/02941_variant_type_1.reference
 create mode 100755 tests/queries/0_stateless/02941_variant_type_1.sh
 create mode 100644 tests/queries/0_stateless/02941_variant_type_2.reference
 create mode 100755 tests/queries/0_stateless/02941_variant_type_2.sh
 create mode 100644 tests/queries/0_stateless/02941_variant_type_3.reference
 create mode 100755 tests/queries/0_stateless/02941_variant_type_3.sh
 create mode 100644 tests/queries/0_stateless/02941_variant_type_4.reference
 create mode 100755 tests/queries/0_stateless/02941_variant_type_4.sh
 create mode 100644 tests/queries/0_stateless/02942_variant_cast.reference
 create mode 100644 tests/queries/0_stateless/02942_variant_cast.sql
 create mode 100644 tests/queries/0_stateless/02943_variant_element.reference
 create mode 100644 tests/queries/0_stateless/02943_variant_element.sql
 create mode 100644 tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference
 create mode 100644 tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql

diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index dc46a3f0dcd..dbf5bc341cc 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -5134,3 +5134,55 @@ When set to `true` than for all s3 requests first two attempts are made with low
 send and receive timeouts.
 When set to `false` than all attempts are made with identical timeouts.
 
 Default value: `true`.
+
+## allow_experimental_variant_type {#allow_experimental_variant_type}
+
+Allows creation of the experimental [Variant](../../sql-reference/data-types/variant.md) data type.
+
+Default value: `false`.
+
+## use_variant_when_no_common_type_in_if {#use_variant_when_no_common_type_in_if}
+
+Allows using the `Variant` type as a result type for [if](../../sql-reference/functions/conditional-functions.md/#if)/[multiIf](../../sql-reference/functions/conditional-functions.md/#multiif) functions when there is no common type for the argument types.
+
+Example:
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT toTypeName(if(number % 2, number, range(number))) as variant_type FROM numbers(1);
+SELECT if(number % 2, number, range(number)) as variant FROM numbers(5);
+```
+
+```text
+┌─variant_type───────────────────┐
+│ Variant(Array(UInt64), UInt64) │
+└────────────────────────────────┘
+┌─variant───┐
+│ [] │
+│ 1 │
+│ [0,1] │
+│ 3 │
+│ [0,1,2,3] │
+└───────────┘
+```
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT toTypeName(multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL)) AS variant_type FROM numbers(1);
+SELECT multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL) AS variant FROM numbers(4);
+```
+
+```text
+┌─variant_type─────────────────────────┐
+│ Variant(Array(UInt8), String, UInt8) │
+└──────────────────────────────────────┘
+
+┌─variant───────┐
+│ 42 │
+│ [1,2,3] │
+│ Hello, World! │
+│ ᴺᵁᴸᴸ │
+└───────────────┘
+```
+
+Default value: `false`.
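+
+A minimal end-to-end sketch combining the two settings above (illustrative only; the table name `t` is arbitrary):
+
+```sql
+SET allow_experimental_variant_type = 1, use_variant_when_no_common_type_in_if = 1;
+CREATE TABLE t (v Variant(Array(UInt64), UInt64)) ENGINE = Memory;
+INSERT INTO t SELECT if(number % 2, number, range(number)) FROM numbers(3);
+SELECT v FROM t;
+```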
diff --git a/docs/en/sql-reference/data-types/variant.md b/docs/en/sql-reference/data-types/variant.md
new file mode 100644
index 00000000000..34966d79079
--- /dev/null
+++ b/docs/en/sql-reference/data-types/variant.md
@@ -0,0 +1,217 @@
+---
+slug: /en/sql-reference/data-types/variant
+sidebar_position: 55
+sidebar_label: Variant
+---
+
+# Variant(T1, T2, T3, ...)
+
+This type represents a union of other data types. Type `Variant(T1, T2, ..., TN)` means that each row of this type
+has a value of either type `T1` or `T2` or ... or `TN` or none of them (`NULL` value).
+
+The order of nested types doesn't matter: Variant(T1, T2) = Variant(T2, T1).
+Nested types can be arbitrary types except Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types.
+
+:::note
+The Variant data type is an experimental feature. To use it, set `allow_experimental_variant_type = 1`.
+:::
+
+## Creating Variant
+
+Using the `Variant` type in a table column definition:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]);
+SELECT v FROM test;
+```
+
+```text
+┌─v─────────────┐
+│ ᴺᵁᴸᴸ │
+│ 42 │
+│ Hello, World! │
+│ [1,2,3] │
+└───────────────┘
+```
+
+Using CAST from an ordinary column:
+
+```sql
+SELECT toTypeName(variant) as type_name, 'Hello, World!'::Variant(UInt64, String, Array(UInt64)) as variant;
+```
+
+```text
+┌─type_name──────────────────────────────┬─variant───────┐
+│ Variant(Array(UInt64), String, UInt64) │ Hello, World! │
+└────────────────────────────────────────┴───────────────┘
+```
+
+Using the functions `if/multiIf` when the arguments don't have a common type (the setting `use_variant_when_no_common_type_in_if` must be enabled for this):
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT if(number % 2, number, range(number)) as variant FROM numbers(5);
+```
+
+```text
+┌─variant───┐
+│ [] │
+│ 1 │
+│ [0,1] │
+│ 3 │
+│ [0,1,2,3] │
+└───────────┘
+```
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL) AS variant FROM numbers(4);
+```
+
+```text
+┌─variant───────┐
+│ 42 │
+│ [1,2,3] │
+│ Hello, World! │
+│ ᴺᵁᴸᴸ │
+└───────────────┘
+```
+
+## Reading Variant nested types as subcolumns
+
+The Variant type supports reading a single nested type from a Variant column using the type name as a subcolumn.
+So, if you have a column `variant Variant(T1, T2, T3)`, you can read a subcolumn of type `T2` using the syntax `variant.T2`.
+This subcolumn will have type `Nullable(T2)` if `T2` can be inside `Nullable`, and `T2` otherwise. It will
+be the same size as the original `Variant` column and will contain `NULL` values (or empty values if `T2` cannot be inside `Nullable`)
+in all rows in which the original `Variant` column doesn't have type `T2`.
+
+Variant subcolumns can also be read using the function `variantElement(variant_column, type_name)`.
+
+Examples:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]);
+SELECT v, v.String, v.UInt64, v.`Array(UInt64)` FROM test;
+```
+
+```text
+┌─v─────────────┬─v.String──────┬─v.UInt64─┬─v.Array(UInt64)─┐
+│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │
+│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │
+│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ [] │
+│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │
+└───────────────┴───────────────┴──────────┴─────────────────┘
+```
+
+```sql
+SELECT toTypeName(v.String), toTypeName(v.UInt64), toTypeName(v.`Array(UInt64)`) FROM test LIMIT 1;
+```
+
+```text
+┌─toTypeName(v.String)─┬─toTypeName(v.UInt64)─┬─toTypeName(v.Array(UInt64))─┐
+│ Nullable(String) │ Nullable(UInt64) │ Array(UInt64) │
+└──────────────────────┴──────────────────────┴─────────────────────────────┘
+```
+
+```sql
+SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test;
+```
+
+```text
+┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐
+│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │
+│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │
+│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ [] │
+│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │
+└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘
+```
+
+## Conversion between Variant column and other columns
+
+There are 3 possible conversions that can be performed with a Variant column.
+
+### Converting an ordinary column to a Variant column
+
+It is possible to convert an ordinary column with type `T` to a `Variant` column containing this type:
+
+```sql
+SELECT toTypeName(variant) as type_name, 'Hello, World!'::Variant(UInt64, String, Array(UInt64)) as variant;
+```
+
+```text
+┌─type_name──────────────────────────────┬─variant───────┐
+│ Variant(Array(UInt64), String, UInt64) │ Hello, World! │
+└────────────────────────────────────────┴───────────────┘
+```
+
+### Converting a Variant column to an ordinary column
+
+It is possible to convert a `Variant` column to an ordinary column. In this case all nested variants are converted to the destination type:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String)) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('42.42');
+SELECT v::Nullable(Float64) FROM test;
+```
+
+```text
+┌─CAST(v, 'Nullable(Float64)')─┐
+│ ᴺᵁᴸᴸ │
+│ 42 │
+│ 42.42 │
+└──────────────────────────────┘
+```
+
+### Converting a Variant to another Variant
+
+It is possible to convert a `Variant` column to another `Variant` column, but only if the destination `Variant` column contains all nested types from the original `Variant`:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String)) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('String');
+SELECT v::Variant(UInt64, String, Array(UInt64)) FROM test;
+```
+
+```text
+┌─CAST(v, 'Variant(UInt64, String, Array(UInt64))')─┐
+│ ᴺᵁᴸᴸ │
+│ 42 │
+│ String │
+└───────────────────────────────────────────────────┘
+```
+
+
+## Reading Variant type from the data
+
+All text formats (TSV, CSV, CustomSeparated, Values, JSONEachRow, etc.) support reading the `Variant` type. During data parsing, ClickHouse tries to insert the value into the most appropriate variant type.
+
+Example:
+
+```sql
+SELECT
+    v,
+    variantElement(v, 'String') AS str,
+    variantElement(v, 'UInt64') AS num,
+    variantElement(v, 'Float64') AS float,
+    variantElement(v, 'DateTime') AS date,
+    variantElement(v, 'Array(UInt64)') AS arr
+FROM format(JSONEachRow, 'v Variant(String, UInt64, Float64, DateTime, Array(UInt64))', $$
+{"v" : "Hello, World!"},
+{"v" : 42},
+{"v" : 42.42},
+{"v" : "2020-01-01 00:00:00"},
+{"v" : [1, 2, 3]}
+$$)
+```
+
+```text
+┌─v───────────────────┬─str───────────┬──num─┬─float─┬────────────────date─┬─arr─────┐
+│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │
+│ 42 │ ᴺᵁᴸᴸ │ 42 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │
+│ 42.42 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ 42.42 │ ᴺᵁᴸᴸ │ [] │
+│ 2020-01-01 00:00:00 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ 2020-01-01 00:00:00 │ [] │
+│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │
+└─────────────────────┴───────────────┴──────┴───────┴─────────────────────┴─────────┘
+```
diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md
index 5b9d01985dd..47b5ac7b724 100644
--- a/docs/en/sql-reference/functions/other-functions.md
+++ b/docs/en/sql-reference/functions/other-functions.md
@@ -2831,3 +2831,39 @@ Result:
 │ SELECT a, b FROM tab WHERE (a > 3) AND (b < 3) │
 └─────────────────────────────────────────────────────────────────────────┘
 ```
+
+## variantElement
+
+Extracts a column with the specified type from a `Variant` column.
+
+**Syntax**
+
+``` sql
+variantElement(variant, type_name[, default_value])
+```
+
+- `variant` — Variant column. [Variant](../../sql-reference/data-types/variant.md).
+- `type_name` — The name of the variant type to extract. [String](../../sql-reference/data-types/string.md).
+- `default_value` — The default value that will be used if the variant doesn't contain a variant with the specified type. Can be any type. Optional.
+
+**Returned value**
+
+- Subcolumn of a `Variant` column with the specified type.
+
+**Example**
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]);
+SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test;
+```
+
+```text
+┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐
+│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │
+│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │
+│ Hello, World! │ Hello, World!
│ ᴺᵁᴸᴸ │ [] │
+│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │
+└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘
+```
+
diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp
index 4ee6bb3d586..d2a579d6800 100644
--- a/src/Columns/ColumnNullable.cpp
+++ b/src/Columns/ColumnNullable.cpp
@@ -890,10 +890,7 @@ ColumnPtr makeNullable(const ColumnPtr & column)
 
 ColumnPtr makeNullableOrLowCardinalityNullable(const ColumnPtr & column)
 {
-    if (isColumnNullable(*column))
-        return column;
-
-    if (isColumnLowCardinalityNullable(*column))
+    if (isColumnNullableOrLowCardinalityNullable(*column))
         return column;
 
     if (isColumnConst(*column))
@@ -919,4 +916,21 @@ ColumnPtr makeNullableSafe(const ColumnPtr & column)
     return column;
 }
 
+ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column)
+{
+    if (isColumnNullableOrLowCardinalityNullable(*column))
+        return column;
+
+    if (isColumnConst(*column))
+        return ColumnConst::create(makeNullableOrLowCardinalityNullableSafe(assert_cast<const ColumnConst &>(*column).getDataColumnPtr()), column->size());
+
+    if (column->lowCardinality())
+        return assert_cast<const ColumnLowCardinality &>(*column).cloneNullable();
+
+    if (column->canBeInsideNullable())
+        return makeNullableSafe(column);
+
+    return column;
+}
+
 }
diff --git a/src/Columns/ColumnNullable.h b/src/Columns/ColumnNullable.h
index b57fdf3064d..60c7750f8fc 100644
--- a/src/Columns/ColumnNullable.h
+++ b/src/Columns/ColumnNullable.h
@@ -231,5 +231,6 @@ private:
 ColumnPtr makeNullable(const ColumnPtr & column);
 ColumnPtr makeNullableSafe(const ColumnPtr & column);
 ColumnPtr makeNullableOrLowCardinalityNullable(const ColumnPtr & column);
+ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column);
 
 }
diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp
new file mode 100644
index 00000000000..67754e77992
--- /dev/null
+++ b/src/Columns/ColumnVariant.cpp
@@ -0,0 +1,1360 @@
+#include
+
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+    extern const int BAD_ARGUMENTS;
+    extern const int ILLEGAL_COLUMN;
+    extern const int NOT_IMPLEMENTED;
+    extern const int LOGICAL_ERROR;
+    extern const int PARAMETER_OUT_OF_BOUND;
+    extern const int SIZES_OF_NESTED_COLUMNS_ARE_INCONSISTENT;
+    extern const int SIZES_OF_COLUMNS_DOESNT_MATCH;
+}
+
+std::string ColumnVariant::getName() const
+{
+    WriteBufferFromOwnString res;
+    res << "Variant(";
+    bool is_first = true;
+    for (const auto & local_variant : global_to_local_discriminators)
+    {
+        if (!is_first)
+            res << ", ";
+        is_first = false;
+        res << variants[local_variant]->getName();
+    }
+    res << ")";
+    return res.str();
+}
+
+
+void ColumnVariant::initIdentityGlobalToLocalDiscriminatorsMapping()
+{
+    local_to_global_discriminators.reserve(variants.size());
+    global_to_local_discriminators.reserve(variants.size());
+    for (size_t i = 0; i != variants.size(); ++i)
+    {
+        local_to_global_discriminators.push_back(i);
+        global_to_local_discriminators.push_back(i);
+    }
+}
+
+ColumnVariant::ColumnVariant(MutableColumns && variants_) : ColumnVariant(std::move(variants_), {})
+{
+}
+
+ColumnVariant::ColumnVariant(MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_)
+{
+    /// Empty local_to_global_discriminators mapping means that variants are already in the global order.
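+    /// (Global discriminators follow the canonical variant order fixed by the Variant data type itself,
+    /// while a particular column instance may store its nested columns in a different, local, order.)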
+    if (!local_to_global_discriminators_.empty() && local_to_global_discriminators_.size() != variants_.size())
+        throw Exception(
+            ErrorCodes::LOGICAL_ERROR,
+            "The number of values in local_to_global_discriminators mapping ({}) doesn't match the number of variants ({})",
+            local_to_global_discriminators_.size(),
+            variants_.size());
+
+    /// As variants are empty, column with local discriminators will be also empty and we can reorder variants according to global discriminators.
+    variants.resize(variants_.size());
+    for (size_t i = 0; i != variants_.size(); ++i)
+    {
+        if (isColumnConst(*variants_[i]))
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element");
+
+        if (!variants_[i]->empty())
+            throw Exception(ErrorCodes::LOGICAL_ERROR, "Not empty column passed to ColumnVariant, but no local_discriminators passed");
+
+        if (!local_to_global_discriminators_.empty() && local_to_global_discriminators_[i] > variants_.size())
+            throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator {}. The number of variants: {}", UInt64(local_to_global_discriminators_[i]), variants_.size());
+
+        if (local_to_global_discriminators_.empty())
+            variants[i] = std::move(variants_[i]);
+        else
+            variants[local_to_global_discriminators_[i]] = std::move(variants_[i]);
+    }
+
+    local_discriminators = ColumnDiscriminators::create();
+    offsets = ColumnOffsets::create();
+
+    /// Now global and local discriminators are the same.
+    initIdentityGlobalToLocalDiscriminatorsMapping();
+}
+
+ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), {})
+{
+}
+
+ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector<Discriminator> & global_discriminators) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), global_discriminators)
+{
+}
+
+ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::MutableColumnPtr offsets_, DB::MutableColumns && variants_) : ColumnVariant(std::move(local_discriminators_), std::move(offsets_), std::move(variants_), {})
+{
+}
+
+ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::MutableColumnPtr offsets_, DB::MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_)
+{
+    if (variants_.size() > MAX_NESTED_COLUMNS)
+        throw Exception(ErrorCodes::BAD_ARGUMENTS, "Variant type with more than {} nested types is not allowed", ColumnVariant::MAX_NESTED_COLUMNS);
+
+    local_discriminators = std::move(local_discriminators_);
+    const ColumnDiscriminators * discriminators_concrete = typeid_cast<const ColumnDiscriminators *>(local_discriminators.get());
+    if (!discriminators_concrete)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "discriminator column must be a ColumnUInt8");
+
+    variants.reserve(variants_.size());
+    size_t total_size = 0;
+    for (auto & variant : variants_)
+    {
+        if (isColumnConst(*variant))
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element");
+
+        total_size += variant->size();
+        variants.push_back(std::move(variant));
+    }
+
+    /// We can have more discriminators than values in columns
+    /// (because of NULL discriminators), but not less.
+    if (total_size > local_discriminators->size())
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested columns sizes are inconsistent with local_discriminators column size.
Total column sizes: {}, local_discriminators size: {}", total_size, local_discriminators->size());
+
+    if (offsets_)
+    {
+        if (!typeid_cast<const ColumnOffsets *>(offsets_.get()))
+            throw Exception(ErrorCodes::LOGICAL_ERROR, "offsets column must be a ColumnUInt64");
+
+        offsets = std::move(offsets_);
+    }
+    else
+    {
+        /// If no offsets column was provided, construct offsets based on discriminators.
+        offsets = ColumnOffsets::create();
+        Offsets & offsets_data = typeid_cast<ColumnOffsets *>(offsets.get())->getData();
+        offsets_data.reserve(discriminators_concrete->size());
+        /// If we have only NULLs, offsets column will not contain any real offsets.
+        if (hasOnlyNulls())
+        {
+            offsets_data.resize(discriminators_concrete->size());
+        }
+        /// If we have only one non-empty variant and no NULLs,
+        /// offsets column will contain just sequential offsets 0, 1, 2, ...
+        else if (getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+        {
+            for (size_t i = 0; i != discriminators_concrete->size(); ++i)
+                offsets_data.push_back(i);
+        }
+        /// Otherwise we should iterate through discriminators and
+        /// remember current offset for each variant column.
+        else
+        {
+            std::vector<Offset> nested_offsets;
+            nested_offsets.resize(variants.size());
+            for (Discriminator discr : discriminators_concrete->getData())
+            {
+                if (discr == NULL_DISCRIMINATOR)
+                    offsets_data.emplace_back();
+                else
+                    offsets_data.push_back(nested_offsets[discr]++);
+            }
+        }
+    }
+
+    /// Empty global_discriminators means that variants are already in global order.
+    if (local_to_global_discriminators_.empty())
+    {
+        initIdentityGlobalToLocalDiscriminatorsMapping();
+    }
+    else
+    {
+        if (local_to_global_discriminators_.size() != variants.size())
+            throw Exception(
+                ErrorCodes::LOGICAL_ERROR,
+                "The number of values in local_to_global_discriminators mapping ({}) doesn't match the number of variants ({})",
+                local_to_global_discriminators_.size(),
+                variants.size());
+
+        local_to_global_discriminators = local_to_global_discriminators_;
+        global_to_local_discriminators.resize(local_to_global_discriminators.size());
+        /// Create mapping global discriminator -> local discriminator
+        for (size_t i = 0; i != local_to_global_discriminators.size(); ++i)
+        {
+            if (local_to_global_discriminators[i] > variants.size())
+                throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator {}.
The number of variants: {}", UInt64(local_to_global_discriminators[i]), variants_.size());
+
+            global_to_local_discriminators[local_to_global_discriminators[i]] = i;
+        }
+    }
+}
+
+ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector<Discriminator> & local_to_global_discriminators)
+{
+    MutableColumns mutable_variants;
+    mutable_variants.reserve(variants.size());
+    for (const auto & variant : variants)
+    {
+        if (isColumnConst(*variant))
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element");
+        mutable_variants.emplace_back(variant->assumeMutable());
+    }
+
+    return ColumnVariant::create(std::move(mutable_variants), local_to_global_discriminators);
+}
+
+ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::Columns & variants, const std::vector<Discriminator> & local_to_global_discriminators)
+{
+    MutableColumns mutable_variants;
+    mutable_variants.reserve(variants.size());
+    for (const auto & variant : variants)
+    {
+        if (isColumnConst(*variant))
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element");
+        mutable_variants.emplace_back(variant->assumeMutable());
+    }
+
+    return ColumnVariant::create(local_discriminators->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators);
+}
+
+ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::ColumnPtr & offsets, const DB::Columns & variants, const std::vector<Discriminator> & local_to_global_discriminators)
+{
+    MutableColumns mutable_variants;
+    mutable_variants.reserve(variants.size());
+    for (const auto & variant : variants)
+    {
+        if (isColumnConst(*variant))
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element");
+        mutable_variants.emplace_back(variant->assumeMutable());
+    }
+
+    return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators);
+}
+
+MutableColumnPtr ColumnVariant::cloneEmpty() const
+{
+    MutableColumns new_variants;
+    new_variants.reserve(variants.size());
+    for (const auto & variant : variants)
+        new_variants.emplace_back(variant->cloneEmpty());
+
+    return ColumnVariant::create(std::move(new_variants), local_to_global_discriminators);
+}
+
+MutableColumnPtr ColumnVariant::cloneResized(size_t new_size) const
+{
+    if (new_size == 0)
+        return cloneEmpty();
+
+    const size_t num_variants = variants.size();
+    size_t size = local_discriminators->size();
+    /// If new size is bigger than the old one, just clone column and append default values.
+    if (new_size >= size)
+    {
+        MutableColumns new_variants;
+        new_variants.reserve(num_variants);
+        for (const auto & variant : variants)
+            new_variants.emplace_back(IColumn::mutate(variant));
+
+        auto res = ColumnVariant::create(IColumn::mutate(local_discriminators), IColumn::mutate(offsets), std::move(new_variants), local_to_global_discriminators);
+        res->insertManyDefaults(new_size - size);
+        return res;
+    }
+
+    /// If new size is less than current size, we should find the new size for all variants.
+
+    /// Optimization for case when we have only NULLs. In this case we should just resize discriminators and offsets.
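+    /// (In the only-NULLs case every variant is empty, so just the discriminators and offsets shrink.)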
+    if (hasOnlyNulls())
+    {
+        MutableColumns new_variants;
+        new_variants.reserve(num_variants);
+        for (const auto & variant : variants)
+            new_variants.emplace_back(IColumn::mutate(variant));
+
+        return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators);
+    }
+
+    /// Optimization for case when there is only 1 non-empty variant and no NULLs.
+    /// In this case we can simply call cloneResized on this single variant, discriminators and offsets.
+    if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+    {
+        MutableColumns new_variants;
+        new_variants.reserve(num_variants);
+        for (size_t i = 0; i != variants.size(); ++i)
+        {
+            if (i == *non_empty_local_discr)
+                new_variants.emplace_back(variants[i]->cloneResized(new_size));
+            else
+                new_variants.emplace_back(variants[i]->cloneEmpty());
+        }
+
+        return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators);
+    }
+
+    const auto & local_discriminators_data = getLocalDiscriminators();
+    const auto & offsets_data = getOffsets();
+
+    /// We can find all variants sizes by scanning all new_size local_discriminators and calculating
+    /// sizes for all new variants. This code is below and commented.
+
+//    std::vector<size_t> new_nested_sizes(num_variants, 0);
+//    for (size_t i = 0; i != new_size; ++i)
+//    {
+//        Discriminator discr = local_discriminators_data[i];
+//        if (discr != NULL_DISCRIMINATOR)
+//            ++new_nested_sizes[discr];
+//    }
+//
+//    MutableColumns new_variants;
+//    new_variants.reserve(num_variants);
+//    for (size_t i = 0; i != num_variants; ++i)
+//    {
+//        if (new_nested_sizes[i])
+//            new_variants.emplace_back(variants[i]->cloneResized(new_nested_sizes[i]));
+//        else
+//            new_variants.emplace_back(variants[i]->cloneEmpty());
+//    }
+//
+//    return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators);
+
+    /// But instead we are trying to optimize it using offsets column:
+    /// For all non-empty variants we are trying to find last occurrence of its discriminator in local_discriminators[:new_size] or
+    /// first occurrence in local_discriminators[new_size:]. The same row in offsets column will contain the desired size (or size - 1) of variant.
+    /// All empty variants will remain empty.
+    /// Not sure how good this optimization is, feel free to remove it and use simpler version above.
+
+    MutableColumns new_variants(num_variants);
+    std::unordered_set<Discriminator> seen_variants;
+    /// First, check which variants are empty. They will remain empty.
+    for (Discriminator i = 0; i != num_variants; ++i)
+    {
+        if (variants[i]->empty())
+        {
+            seen_variants.insert(i);
+            new_variants[i] = variants[i]->cloneEmpty();
+        }
+    }
+
+    /// Now, iterate through local discriminators using two pointers.
+    /// First will go from new_size - 1 to 0, second from new_size to size.
+    /// Finish when we find all variants or hit lower or upper bound.
+    ssize_t i = new_size - 1;
+    size_t j = new_size;
+    while (i != -1 && j != size)
+    {
+        Discriminator i_discr = local_discriminators_data[i];
+        if (i_discr != NULL_DISCRIMINATOR)
+        {
+            auto [_, inserted] = seen_variants.insert(i_discr);
+            /// If this is the first occurrence of this discriminator,
+            /// we can get new size for this variant.
+            if (inserted)
+            {
+                new_variants[i_discr] = variants[i_discr]->cloneResized(offsets_data[i] + 1);
+                if (seen_variants.size() == num_variants)
+                    break;
+            }
+        }
+
+        Discriminator j_discr = local_discriminators_data[j];
+        if (j_discr != NULL_DISCRIMINATOR)
+        {
+            auto [_, inserted] = seen_variants.insert(j_discr);
+            /// If this is the first occurrence of this discriminator,
+            /// we can get new size for this variant.
+            if (inserted)
+            {
+                new_variants[j_discr] = variants[j_discr]->cloneResized(offsets_data[j]);
+                if (seen_variants.size() == num_variants)
+                    break;
+            }
+        }
+
+        --i;
+        ++j;
+    }
+
+    /// We can finish in 3 cases:
+    /// 1) seen_variants.size() == num_variants - we found local_discriminators of all variants, nothing to do.
+    /// 2) i == -1 - we scanned all values in local_discriminators[:new_size]. Variants that were not found have no
+    ///    values in local_discriminators[:new_size], so they should be empty in the resized version.
+    /// 3) j == size - we scanned all values in local_discriminators[new_size:]. Variants that were not found have no
+    ///    values in local_discriminators[new_size:], so we should use the full variant in the resized version.
+    if (seen_variants.size() != num_variants)
+    {
+        for (size_t discr = 0; discr != num_variants; ++discr)
+        {
+            if (!seen_variants.contains(discr))
+            {
+                if (i == -1)
+                    new_variants[discr] = variants[discr]->cloneEmpty();
+                else
+                    new_variants[discr] = IColumn::mutate(variants[discr]);
+            }
+        }
+    }
+
+    return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators);
+}
+
+Field ColumnVariant::operator[](size_t n) const
+{
+    Discriminator discr = localDiscriminatorAt(n);
+    if (discr == NULL_DISCRIMINATOR)
+        return Null();
+    return (*variants[discr])[offsetAt(n)];
+}
+
+void ColumnVariant::get(size_t n, Field & res) const
+{
+    Discriminator discr = localDiscriminatorAt(n);
+    if (discr == NULL_DISCRIMINATOR)
+        res = Null();
+    else
+        variants[discr]->get(offsetAt(n), res);
+}
+
+bool ColumnVariant::isDefaultAt(size_t n) const
+{
+    return localDiscriminatorAt(n) == NULL_DISCRIMINATOR;
+}
+
+bool ColumnVariant::isNullAt(size_t n) const
+{
+    return localDiscriminatorAt(n) == NULL_DISCRIMINATOR;
+}
+
+StringRef ColumnVariant::getDataAt(size_t) const
+{
+    throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method getDataAt is not supported for {}", getName());
+}
+
+void ColumnVariant::insertData(const char *, size_t)
+{
+    throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method insertData is not supported for {}", getName());
+}
+
+void ColumnVariant::insert(const Field & field)
+{
+    if (field.isNull())
+        insertDefault();
+    else
+        throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(field), getName());
+}
+
+void ColumnVariant::insertFrom(const IColumn & src_, size_t n)
+{
+    const ColumnVariant & src = assert_cast<const ColumnVariant &>(src_);
+
+    const size_t num_variants = variants.size();
+    if (src.variants.size() != num_variants)
+        throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types");
+
+    /// Remember that src column can have different local variants order.
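+    /// Two columns of the same Variant type may order their nested columns differently, so the row's
+    /// discriminator is translated src-local -> global -> our-local before use.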
+    Discriminator global_discr = src.globalDiscriminatorAt(n);
+    Discriminator local_discr = localDiscriminatorByGlobal(global_discr);
+    getLocalDiscriminators().push_back(local_discr);
+    if (local_discr == NULL_DISCRIMINATOR)
+    {
+        getOffsets().emplace_back();
+    }
+    else
+    {
+        getOffsets().push_back(variants[local_discr]->size());
+        variants[local_discr]->insertFrom(src.getVariantByGlobalDiscriminator(global_discr), src.offsetAt(n));
+    }
+}
+
+void ColumnVariant::insertRangeFrom(const IColumn & src_, size_t start, size_t length)
+{
+    const size_t num_variants = variants.size();
+    const auto & src = assert_cast<const ColumnVariant &>(src_);
+    if (src.variants.size() != num_variants)
+        throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types");
+
+    if (start + length > src.getLocalDiscriminators().size())
+        throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Parameter out of bound in ColumnVariant::insertRangeFrom method. "
+                        "[start({}) + length({}) > local_discriminators.size({})]", start, length, src.getLocalDiscriminators().size());
+
+    /// If src column contains only NULLs, just insert NULLs.
+    if (src.hasOnlyNulls())
+    {
+        insertManyDefaults(length);
+        return;
+    }
+
+    /// Optimization for case when there is only 1 non-empty variant and no NULLs in src column.
+    /// In this case we can simply call insertRangeFrom on this single variant.
+    if (auto non_empty_src_local_discr = src.getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+    {
+        auto local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(*non_empty_src_local_discr));
+        size_t offset = variants[local_discr]->size();
+        variants[local_discr]->insertRangeFrom(*src.variants[*non_empty_src_local_discr], start, length);
+        getLocalDiscriminators().resize_fill(local_discriminators->size() + length, local_discr);
+        auto & offsets_data = getOffsets();
+        offsets_data.reserve(offsets_data.size() + length);
+        for (size_t i = 0; i != length; ++i)
+            offsets_data.push_back(offset++);
+        return;
+    }
+
+    /// Iterate through src local_discriminators in range [start, start + length],
+    /// collect ranges we need to insert for all variants and update offsets.
+    /// nested_ranges[i].first - offset in src.variants[i]
+    /// nested_ranges[i].second - length in src.variants[i]
+    std::vector<std::pair<size_t, size_t>> nested_ranges(num_variants, {0, 0});
+    auto & offsets_data = getOffsets();
+    offsets_data.reserve(offsets_data.size() + length);
+    auto & local_discriminators_data = getLocalDiscriminators();
+    local_discriminators_data.reserve(local_discriminators_data.size() + length);
+    const auto & src_offsets_data = src.getOffsets();
+    const auto & src_local_discriminators_data = src.getLocalDiscriminators();
+    for (size_t i = start; i != start + length; ++i)
+    {
+        /// We insert from src.variants[src_local_discr] to variants[local_discr]
+        Discriminator src_local_discr = src_local_discriminators_data[i];
+        Discriminator local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr));
+        local_discriminators_data.push_back(local_discr);
+        if (local_discr == NULL_DISCRIMINATOR)
+        {
+            offsets_data.emplace_back();
+        }
+        else
+        {
+            /// If we see this discriminator for the first time, set its range start.
+            if (!nested_ranges[src_local_discr].second)
+                nested_ranges[src_local_discr].first = src_offsets_data[i];
+            /// Update offsets column with correct offset.
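+            /// The offset is the destination variant's current size plus the number of rows already
+            /// collected (but not yet inserted) for this variant from the source range.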
+            offsets_data.push_back(variants[local_discr]->size() + nested_ranges[src_local_discr].second);
+            ++nested_ranges[src_local_discr].second;
+        }
+    }
+
+    for (size_t src_local_discr = 0; src_local_discr != nested_ranges.size(); ++src_local_discr)
+    {
+        auto [nested_start, nested_length] = nested_ranges[src_local_discr];
+        auto local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr));
+        if (nested_length)
+            variants[local_discr]->insertRangeFrom(*src.variants[src_local_discr], nested_start, nested_length);
+    }
+}
+
+void ColumnVariant::insertManyFrom(const DB::IColumn & src_, size_t position, size_t length)
+{
+    const size_t num_variants = variants.size();
+    const auto & src = assert_cast<const ColumnVariant &>(src_);
+    if (src.variants.size() != num_variants)
+        throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types");
+
+    /// Remember that src column can have different local variants order.
+    Discriminator src_local_discr = src.localDiscriminatorAt(position);
+    Discriminator local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr));
+    auto & local_discriminators_data = getLocalDiscriminators();
+    local_discriminators_data.resize_fill(local_discriminators_data.size() + length, local_discr);
+
+    auto & offsets_data = getOffsets();
+    if (local_discr == NULL_DISCRIMINATOR)
+    {
+        offsets_data.resize_fill(offsets_data.size() + length);
+    }
+    else
+    {
+        size_t prev_offset = variants[local_discr]->size();
+        offsets_data.reserve(offsets_data.size() + length);
+        for (size_t i = 0; i != length; ++i)
+            offsets_data.push_back(prev_offset + i);
+
+        variants[local_discr]->insertManyFrom(*src.variants[src_local_discr], src.offsetAt(position), length);
+    }
+}
+
+void ColumnVariant::insertDefault()
+{
+    getLocalDiscriminators().push_back(NULL_DISCRIMINATOR);
+    getOffsets().emplace_back();
+}
+
+void ColumnVariant::insertManyDefaults(size_t length)
+{
+    size_t size = local_discriminators->size();
+    getLocalDiscriminators().resize_fill(size + length, NULL_DISCRIMINATOR);
+    getOffsets().resize_fill(size + length);
+}
+
+void ColumnVariant::popBack(size_t n)
+{
+    /// If we have only NULLs, just pop back from local_discriminators and offsets.
+    if (hasOnlyNulls())
+    {
+        local_discriminators->popBack(n);
+        offsets->popBack(n);
+        return;
+    }
+
+    /// Optimization for case when there is only 1 non-empty variant and no NULLs.
+    /// In this case we can just popBack n elements from this variant.
+    if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+    {
+        variants[*non_empty_local_discr]->popBack(n);
+        local_discriminators->popBack(n);
+        offsets->popBack(n);
+        return;
+    }
+
+    /// Calculate how many rows we need to pop from each variant
+    auto & local_discriminators_data = getLocalDiscriminators();
+    size_t size = local_discriminators_data.size();
+    const size_t num_variants = variants.size();
+    std::vector<size_t> nested_n(num_variants, 0);
+    for (size_t i = 0; i != n; ++i)
+    {
+        Discriminator discr = local_discriminators_data[size - i - 1];
+        if (discr != NULL_DISCRIMINATOR)
+            ++nested_n[discr];
+    }
+
+    for (size_t i = 0; i != num_variants; ++i)
+    {
+        if (nested_n[i])
+            variants[i]->popBack(nested_n[i]);
+    }
+
+    local_discriminators->popBack(n);
+    offsets->popBack(n);
+}
+
+StringRef ColumnVariant::serializeValueIntoArena(size_t n, Arena & arena, char const *& begin, const UInt8 *) const
+{
+    /// During any serialization/deserialization we should always use global discriminators.
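+    /// Local discriminators are specific to this column instance, while global ones are fixed by the
+    /// Variant type, so serialized rows stay interpretable when read back into another column.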
+    Discriminator global_discr = globalDiscriminatorAt(n);
+    char * pos = arena.allocContinue(sizeof(global_discr), begin);
+    memcpy(pos, &global_discr, sizeof(global_discr));
+    StringRef res(pos, sizeof(global_discr));
+
+    if (global_discr == NULL_DISCRIMINATOR)
+        return res;
+
+    auto value_ref = variants[localDiscriminatorByGlobal(global_discr)]->serializeValueIntoArena(offsetAt(n), arena, begin);
+    res.data = value_ref.data - res.size;
+    res.size += value_ref.size;
+
+    return res;
+}
+
+const char * ColumnVariant::deserializeAndInsertFromArena(const char * pos)
+{
+    /// During any serialization/deserialization we should always use global discriminators.
+    Discriminator global_discr = unalignedLoad<Discriminator>(pos);
+    pos += sizeof(global_discr);
+    Discriminator local_discr = localDiscriminatorByGlobal(global_discr);
+    getLocalDiscriminators().push_back(local_discr);
+    if (local_discr == NULL_DISCRIMINATOR)
+    {
+        getOffsets().emplace_back();
+        return pos;
+    }
+
+    getOffsets().push_back(variants[local_discr]->size());
+    return variants[local_discr]->deserializeAndInsertFromArena(pos);
+}
+
+const char * ColumnVariant::skipSerializedInArena(const char * pos) const
+{
+    Discriminator global_discr = unalignedLoad<Discriminator>(pos);
+    pos += sizeof(global_discr);
+    if (global_discr == NULL_DISCRIMINATOR)
+        return pos;
+
+    return variants[localDiscriminatorByGlobal(global_discr)]->skipSerializedInArena(pos);
+}
+
+void ColumnVariant::updateHashWithValue(size_t n, SipHash & hash) const
+{
+    Discriminator global_discr = globalDiscriminatorAt(n);
+    hash.update(global_discr);
+    if (global_discr != NULL_DISCRIMINATOR)
+        variants[localDiscriminatorByGlobal(global_discr)]->updateHashWithValue(offsetAt(n), hash);
+}
+
+void ColumnVariant::updateWeakHash32(WeakHash32 & hash) const
+{
+    auto s = size();
+
+    if (hash.getData().size() != s)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Size of WeakHash32 does not match size of column: "
+                        "column size is {}, hash size is {}", std::to_string(s), std::to_string(hash.getData().size()));
+
+    /// If we have only NULLs, keep hash unchanged.
+    if (hasOnlyNulls())
+        return;
+
+    /// Optimization for case when there is only 1 non-empty variant and no NULLs.
+    /// In this case we can just calculate weak hash for this variant.
+    if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+    {
+        variants[*non_empty_local_discr]->updateWeakHash32(hash);
+        return;
+    }
+
+    /// Calculate weak hash for all variants.
+    std::vector<WeakHash32> nested_hashes;
+    for (const auto & variant : variants)
+    {
+        WeakHash32 nested_hash(variant->size());
+        variant->updateWeakHash32(nested_hash);
+        nested_hashes.emplace_back(std::move(nested_hash));
+    }
+
+    /// For each row hash is a hash of corresponding row from corresponding variant.
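+    /// Rows with NULL_DISCRIMINATOR are skipped below, so their previous hash values stay unchanged.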
+ auto & hash_data = hash.getData(); + const auto & local_discriminators_data = getLocalDiscriminators(); + const auto & offsets_data = getOffsets(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + /// Update hash only for non-NULL values + if (discr != NULL_DISCRIMINATOR) + { + auto nested_hash = nested_hashes[local_discriminators_data[i]].getData()[offsets_data[i]]; + hash_data[i] = static_cast(hashCRC32(nested_hash, hash_data[i])); + } + } +} + +void ColumnVariant::updateHashFast(SipHash & hash) const +{ + local_discriminators->updateHashFast(hash); + for (const auto & variant : variants) + variant->updateHashFast(hash); +} + +ColumnPtr ColumnVariant::filter(const Filter & filt, ssize_t result_size_hint) const +{ + if (size() != filt.size()) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_DOESNT_MATCH, "Size of filter ({}) doesn't match size of column ({})", filt.size(), size()); + + /// If we have only NULLs, just filter local_discriminators column. + if (hasOnlyNulls()) + { + Columns new_variants(variants.begin(), variants.end()); + auto new_discriminators = local_discriminators->filter(filt, result_size_hint); + /// In case of all NULL values offsets doesn't contain any useful values, just resize it. + ColumnPtr new_offsets = offsets->cloneResized(new_discriminators->size()); + return ColumnVariant::create(new_discriminators, new_offsets, new_variants, local_to_global_discriminators); + } + + /// Optimization for case when there is only 1 non-empty variant and no NULLs. + /// In this case we can just filter this variant and resize discriminators/offsets. + if (auto non_empty_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + Columns new_variants(variants.begin(), variants.end()); + new_variants[*non_empty_discr] = variants[*non_empty_discr]->filter(filt, result_size_hint); + size_t new_size = new_variants[*non_empty_discr]->size(); + ColumnPtr new_discriminators = local_discriminators->cloneResized(new_size); + ColumnPtr new_offsets = offsets->cloneResized(new_size); + return ColumnVariant::create(new_discriminators, new_offsets, new_variants, local_to_global_discriminators); + } + + /// We should create filter for each variant + /// according to local_discriminators and given filter. + const size_t num_variants = variants.size(); + std::vector nested_filters(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_filters[i].reserve(variants[i]->size()); + + /// As we will iterate through local_discriminators anyway, we can count + /// result size for each variant. + std::vector variant_result_size_hints(num_variants); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + nested_filters[local_discriminators_data[i]].push_back(filt[i]); + variant_result_size_hints[local_discriminators_data[i]] += !!(filt[i]); + } + } + + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + /// It make sense to call filter() on variant only if the result size is not 0. + if (variant_result_size_hints[i]) + new_variants.emplace_back(variants[i]->filter(nested_filters[i], variant_result_size_hints[i])); + else + new_variants.emplace_back(variants[i]->cloneEmpty()); + } + + /// We cannot use filtered offsets column, as it will be incorrect. 
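+ /// (After filtering, each surviving row's offset must point into the filtered variant,
+ /// so the old offset values are stale.)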
+ /// It will be reconstructed on ColumnVariant creation according to new local_discriminators. + return ColumnVariant::create(local_discriminators->filter(filt, result_size_hint), new_variants, local_to_global_discriminators); +} + +void ColumnVariant::expand(const Filter & mask, bool inverted) +{ + /// Expand local_discriminators using NULL_DISCRIMINATOR for 0-rows. + expandDataByMask(getLocalDiscriminators(), mask, inverted, NULL_DISCRIMINATOR); + expandDataByMask(getOffsets(), mask, inverted); +} + +ColumnPtr ColumnVariant::permute(const Permutation & perm, size_t limit) const +{ + /// If we have only NULLs, permutation will take no effect, just return resized column. + if (hasOnlyNulls()) + return cloneResized(limit); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. In this case we can just apply permutation to this + /// single non-empty variant and cut local_discriminators and offsets columns to the result size. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + const size_t num_variants = variants.size(); + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->permute(perm, limit)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->assumeMutable()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + return permuteImpl(*this, perm, limit); +} + +ColumnPtr ColumnVariant::index(const IColumn & indexes, size_t limit) const +{ + /// If we have only NULLs, index will take no effect, just return resized column. + if (hasOnlyNulls()) + return cloneResized(limit); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. So we can just apply indexes to this + /// single non-empty variant and cut local_discriminators and offsets columns to the result size. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + const size_t num_variants = variants.size(); + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->index(indexes, limit)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->assumeMutable()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + return selectIndexImpl(*this, indexes, limit); +} + +template +ColumnPtr ColumnVariant::indexImpl(const PaddedPODArray & indexes, size_t limit) const +{ + /// First, apply indexes for local_discriminators and offsets. 
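+ /// The indexed offsets still point into the unpermuted variants, so below they are
+ /// reused as per-variant permutations: for each selected row, its old offset says
+ /// which row to take from the corresponding variant.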
+ ColumnPtr new_local_discriminators = assert_cast(*local_discriminators).indexImpl(indexes, limit); + ColumnPtr new_offsets = assert_cast(*offsets).indexImpl(indexes, limit); + const auto & new_local_discriminators_data = assert_cast(*new_local_discriminators).getData(); + const auto & new_offsets_data = assert_cast(*new_offsets).getData(); + /// Then, create permutation for each variant. + const size_t num_variants = variants.size(); + std::vector nested_perms(num_variants); + /// If there is no limit, we know the size of each permutation + /// in advance and can use reserve. + if (limit == 0) + { + for (size_t i = 0; i != num_variants; ++i) + nested_perms[i].reserve(variants[i]->size()); + } + + for (size_t i = 0; i != new_local_discriminators_data.size(); ++i) + { + Discriminator discr = new_local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + nested_perms[discr].push_back(new_offsets_data[i]); + } + + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + size_t nested_limit = nested_perms[i].size() == variants[i]->size() ? 0 : nested_perms[i].size(); + new_variants.emplace_back(variants[i]->permute(nested_perms[i], nested_limit)); + } + + /// We cannot use new_offsets column as an offset column, because it became invalid after variants permutation. + /// New offsets column will be created in constructor. + return ColumnVariant::create(new_local_discriminators, new_variants, local_to_global_discriminators); +} + +ColumnPtr ColumnVariant::replicate(const Offsets & replicate_offsets) const +{ + if (size() != replicate_offsets.size()) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_DOESNT_MATCH, "Size of offsets {} doesn't match size of column {}", replicate_offsets.size(), size()); + + if (empty()) + return cloneEmpty(); + + /// If we have only NULLs, just resize column to the new size. + if (hasOnlyNulls()) + return cloneResized(replicate_offsets.back()); + + const size_t num_variants = variants.size(); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. So we can just replicate this one non empty variant, + /// then resize local_discriminators to the result size and fill offsets column. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->replicate(replicate_offsets)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->cloneEmpty()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + /// Create and fill new local_discriminators column with non_empty_index discriminator. + auto new_local_discriminators = IColumn::mutate(local_discriminators); + assert_cast(*new_local_discriminators).getData().resize_fill(new_size, *non_empty_local_discr); + /// Create and fill new offsets column with sequential indexes. 
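+ /// E.g. if the old offsets were [0, 1, 2] and the single variant was replicated
+ /// to 5 rows, the offsets column becomes [0, 1, 2, 3, 4].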
+ auto new_offsets = IColumn::mutate(offsets); + auto & new_offsets_data = assert_cast(*new_offsets).getData(); + size_t old_size = offsets->size(); + if (new_size > old_size) + { + new_offsets_data.reserve(new_size); + for (size_t i = old_size; i < new_size; ++i) + new_offsets_data.push_back(new_offsets_data[i - 1] + 1); + } + else + { + new_offsets_data.resize(new_size); + } + + return ColumnVariant::create(std::move(new_local_discriminators), std::move(new_offsets), std::move(new_variants), local_to_global_discriminators); + } + + /// Create replicate offsets for each variant according to + /// local_discriminators column. + std::vector nested_replicated_offsets(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_replicated_offsets[i].reserve(variants[i]->size()); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + size_t repeat_count = replicate_offsets[i] - replicate_offsets[i - 1]; + nested_replicated_offsets[discr].push_back(nested_replicated_offsets[discr].back() + repeat_count); + } + } + + auto new_local_discriminators = local_discriminators->replicate(replicate_offsets); + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + new_variants.emplace_back(variants[i]->replicate(nested_replicated_offsets[i])); + + /// New offsets column will be created in constructor. + return ColumnVariant::create(new_local_discriminators, new_variants, local_to_global_discriminators); +} + +MutableColumns ColumnVariant::scatter(ColumnIndex num_columns, const Selector & selector) const +{ + const size_t num_variants = variants.size(); + + /// If we have only NULLs, we need to scatter only local_discriminators. + if (hasOnlyNulls()) + { + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (const auto & variant : variants) + new_variants.emplace_back(IColumn::mutate(variant)); + + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(new_variants), local_to_global_discriminators)); + } + + return result; + } + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case we can just scatter local_discriminators and this non empty variant. 
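+ /// (scatter() distributes rows into num_columns new columns according to selector[row]:
+ /// e.g. selector [0, 1, 0] sends rows 0 and 2 to result column 0 and row 1 to result column 1.)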
+ if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + auto scattered_non_empty_variant = variants[*non_empty_local_discr]->scatter(num_columns, selector); + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns scattered_nested_variants(num_variants); + for (size_t j = 0; j != num_variants; ++j) + { + if (j == *non_empty_local_discr) + scattered_nested_variants[j] = std::move(scattered_non_empty_variant[i]); + else + scattered_nested_variants[j] = IColumn::mutate(variants[j]); + } + + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(scattered_nested_variants), local_to_global_discriminators)); + } + + return result; + } + + /// Create selector for each variant according to local_discriminators. + std::vector nested_selectors(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_selectors[i].reserve(variants[i]->size()); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + nested_selectors[discr].push_back(selector[i]); + } + + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + std::vector nested_scattered_variants; + nested_scattered_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_scattered_variants.emplace_back(variants[i]->scatter(num_columns, nested_selectors[i])); + + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (size_t j = 0; j != num_variants; ++j) + new_variants.emplace_back(std::move(nested_scattered_variants[j][i])); + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(new_variants), local_to_global_discriminators)); + } + + return result; +} + +void ColumnVariant::gather(ColumnGathererStream & gatherer) +{ + gatherer.gather(*this); +} + +bool ColumnVariant::hasEqualValues() const +{ + if (local_discriminators->empty() || hasOnlyNulls()) + return true; + + return local_discriminators->hasEqualValues() && variants[localDiscriminatorAt(0)]->hasEqualValues(); +} + +void ColumnVariant::getPermutation(IColumn::PermutationSortDirection, IColumn::PermutationSortStability, size_t, int, IColumn::Permutation & res) const +{ + size_t s = local_discriminators->size(); + res.resize(s); + for (size_t i = 0; i < s; ++i) + res[i] = i; +} + +void ColumnVariant::updatePermutation(IColumn::PermutationSortDirection, IColumn::PermutationSortStability, size_t, int, IColumn::Permutation &, DB::EqualRanges &) const +{ +} + +void ColumnVariant::reserve(size_t n) +{ + local_discriminators->reserve(n); + offsets->reserve(n); +} + +void ColumnVariant::ensureOwnership() +{ + const size_t num_variants = variants.size(); + for (size_t i = 0; i < num_variants; ++i) + getVariantByLocalDiscriminator(i).ensureOwnership(); +} + +size_t ColumnVariant::byteSize() const +{ + size_t res = local_discriminators->byteSize() + offsets->byteSize(); + for (const auto & variant : variants) + res += variant->byteSize(); + return res; +} + +size_t ColumnVariant::byteSizeAt(size_t n) const +{ + size_t res = sizeof(Offset) + 
sizeof(Discriminator); + Discriminator discr = localDiscriminatorAt(n); + if (discr == NULL_DISCRIMINATOR) + return res; + + return res + variants[discr]->byteSizeAt(offsetAt(n)); +} + +size_t ColumnVariant::allocatedBytes() const +{ + size_t res = local_discriminators->allocatedBytes() + offsets->allocatedBytes(); + for (const auto & variant : variants) + res += variant->allocatedBytes(); + return res; +} + +void ColumnVariant::protect() +{ + local_discriminators->protect(); + offsets->protect(); + for (auto & variant : variants) + variant->protect(); +} + +void ColumnVariant::getExtremes(Field & min, Field & max) const +{ + min = Null(); + max = Null(); +} + +void ColumnVariant::forEachSubcolumn(MutableColumnCallback callback) +{ + callback(local_discriminators); + callback(offsets); + for (auto & variant : variants) + callback(variant); +} + +void ColumnVariant::forEachSubcolumnRecursively(RecursiveMutableColumnCallback callback) +{ + callback(*local_discriminators); + local_discriminators->forEachSubcolumnRecursively(callback); + callback(*offsets); + offsets->forEachSubcolumnRecursively(callback); + + for (auto & variant : variants) + { + callback(*variant); + variant->forEachSubcolumnRecursively(callback); + } +} + +bool ColumnVariant::structureEquals(const IColumn & rhs) const +{ + const auto * rhs_variant = typeid_cast(&rhs); + if (!rhs_variant) + return false; + + const size_t num_variants = variants.size(); + if (num_variants != rhs_variant->variants.size()) + return false; + + for (size_t i = 0; i < num_variants; ++i) + if (!variants[i]->structureEquals(rhs_variant->getVariantByGlobalDiscriminator(globalDiscriminatorByLocal(i)))) + return false; + + return true; +} + +ColumnPtr ColumnVariant::compress() const +{ + ColumnPtr local_discriminators_compressed = local_discriminators->compress(); + ColumnPtr offsets_compressed = offsets->compress(); + size_t byte_size = local_discriminators_compressed->byteSize() + offsets_compressed->byteSize(); + Columns compressed; + compressed.reserve(variants.size()); + for (const auto & variant : variants) + { + auto compressed_variant = variant->compress(); + byte_size += compressed_variant->byteSize(); + compressed.emplace_back(std::move(compressed_variant)); + } + + return ColumnCompressed::create(size(), byte_size, + [my_local_discriminators_compressed = std::move(local_discriminators_compressed), my_offsets_compressed = std::move(offsets_compressed), my_compressed = std::move(compressed), my_local_to_global_discriminators = this->local_to_global_discriminators]() mutable + { + for (auto & variant : my_compressed) + variant = variant->decompress(); + return ColumnVariant::create(my_local_discriminators_compressed->decompress(), my_offsets_compressed->decompress(), my_compressed, my_local_to_global_discriminators); + }); +} + +double ColumnVariant::getRatioOfDefaultRows(double) const +{ + UInt64 num_defaults = getNumberOfDefaultRows(); + return static_cast(num_defaults) / local_discriminators->size(); +} + +UInt64 ColumnVariant::getNumberOfDefaultRows() const +{ + size_t total_variant_sizes = 0; + for (const auto & variant : variants) + total_variant_sizes += variant->size(); + return local_discriminators->size() - total_variant_sizes; +} + +void ColumnVariant::getIndicesOfNonDefaultRows(Offsets & indices, size_t from, size_t limit) const +{ + return getIndicesOfNonDefaultRowsImpl(indices, from, limit); +} + +void ColumnVariant::finalize() +{ + for (auto & variant : variants) + variant->finalize(); +} + +bool ColumnVariant::isFinalized() 
const +{ + return std::all_of(variants.begin(), variants.end(), [](const auto & variant) { return variant->isFinalized(); }); +} + +std::optional ColumnVariant::getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls() const +{ + for (size_t i = 0; i != variants.size(); ++i) + { + if (variants[i]->size() == local_discriminators->size()) + return i; + } + + return std::nullopt; +} + +void ColumnVariant::applyNullMap(const ColumnVector::Container & null_map) +{ + applyNullMapImpl(null_map); +} + +void ColumnVariant::applyNegatedNullMap(const ColumnVector::Container & null_map) +{ + applyNullMapImpl(null_map); +} + +template +void ColumnVariant::applyNullMapImpl(const ColumnVector::Container & null_map) +{ + if (null_map.size() != local_discriminators->size()) + throw Exception(ErrorCodes::SIZES_OF_NESTED_COLUMNS_ARE_INCONSISTENT, + "Logical error: Sizes of discriminators column and null map data are not equal"); + + /// If we have only NULLs, nothing to do. + if (hasOnlyNulls()) + { + return; + } + + /// If we have only 1 non empty column and no NULLs, we can just filter that + /// variant according to the null_map. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + auto & local_discriminators_data = getLocalDiscriminators(); + auto & offsets_data = getOffsets(); + size_t size_hint = 0; + + if constexpr (inverted) + { + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + if (null_map[i]) + offsets_data[i] = size_hint++; + else + local_discriminators_data[i] = NULL_DISCRIMINATOR; + } + variants[*non_empty_local_discr] = variants[*non_empty_local_discr]->filter(null_map, size_hint); + } + else + { + ColumnVector::Container filter; + filter.reserve(null_map.size()); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + if (null_map[i]) + { + filter.push_back(0); + local_discriminators_data[i] = NULL_DISCRIMINATOR; + } + else + { + filter.push_back(1); + offsets_data[i] = size_hint++; + } + } + variants[*non_empty_local_discr] = variants[*non_empty_local_discr]->filter(filter, size_hint); + } + + return; + } + + /// In general case we should iterate through null_map + discriminators, + /// create filter for each variant and update offsets column. + std::vector variant_filters; + variant_filters.resize(variants.size()); + std::vector variant_new_sizes; + variant_new_sizes.resize(variants.size(), 0); + + auto & local_discriminators_data = getLocalDiscriminators(); + auto & offsets_data = getOffsets(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + auto & discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + if (null_map[i] ^ inverted) + { + auto & variant_filter = variant_filters[discr]; + /// We create filters lazily. + if (variant_filter.empty()) + variant_filter.resize_fill(variants[discr]->size(), 1); + variant_filter[offsets_data[i]] = 0; + discr = NULL_DISCRIMINATOR; + } + else + { + offsets_data[i] = variant_new_sizes[discr]++; + } + } + } + + for (size_t i = 0; i != variants.size(); ++i) + { + if (!variant_filters[i].empty()) + variants[i] = variants[i]->filter(variant_filters[i], variant_new_sizes[i]); + } +} + +} diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h new file mode 100644 index 00000000000..692fdd1709e --- /dev/null +++ b/src/Columns/ColumnVariant.h @@ -0,0 +1,306 @@ +#pragma once + +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + +/** + * Column for storing Variant(...) 
type values.
+ * Variant type represents a union of other data types.
+ * For example, type Variant(T1, T2, ..., TN) means that each row of this type
+ * has a value of either type T1 or T2 or ... or TN or none of them (NULL value).
+ *
+ * ColumnVariant stores:
+ * - The discriminators column, which determines which variant is stored in each row.
+ * - The offsets column, which determines the offset in the corresponding variant column in each row.
+ * - The list of variant columns with only real values (so the sizes of variant columns can be different).
+ * Discriminator is an index of a variant in the variants list; it also has a special value called NULL_DISCRIMINATOR
+ * that indicates that the value in the row is NULL.
+ *
+ * We want to be able to extend Variant column for free without rewriting the data, but as we don't care about the
+ * order of variants during Variant creation (we want Variant(T1, T2) to be the same as Variant(T2, T1)), we support
+ * some global order of nested types inside Variant during type creation, so after extension the order of variant types
+ * (and so their discriminators) can change. For example: Variant(T1, T3) -> Variant(T1, T2, T3).
+ * To avoid a full rewrite of the discriminators column on Variant extension, we differentiate the local order of variants
+ * inside a column and the global order of variants created during type creation. So, ColumnVariant stores only local
+ * discriminators and additionally stores the mapping between global and local discriminators.
+ * So, when we need to extend a Variant column with a new variant, we can just append it to the list of variant columns
+ * with a new local discriminator and update the mapping between global and local orders.
+ *
+ * Note that two instances of ColumnVariant can have different local orders, so we should always use global
+ * discriminators during inter-column interactions.
+ *
+ * Let's take an example with type Variant(UInt32, String, Array(UInt32)):
+ * During type creation we will sort types by their names and get the global order: Array(UInt32), String, UInt32.
+ * So, type Array(UInt32) will have global discriminator 0, String - 1 and UInt32 - 2.
+ * Let's say we have a column with local order (String, UInt32, Array(UInt32)) and values:
+ * 'Hello', 42, NULL, 'World', 43, [1, 2, 3], NULL, 44
+ *
+ * Let's see how these values will be stored in ColumnVariant:
+ *
+ * local_to_global_discriminators: {0 : 1, 1 : 2, 2 : 0}
+ * global_to_local_discriminators: {0 : 2, 1 : 0, 2 : 1}
+ *
+ * local_discriminators    offsets    String     UInt32    Array(UInt32)
+ * 0                       0          'Hello'    42        [1, 2, 3]
+ * 1                       0          'World'    43
+ * NULL_DISCRIMINATOR      0                     44
+ * 0                       1
+ * 1                       1
+ * 2                       0
+ * NULL_DISCRIMINATOR      0
+ * 1                       2
+ *
+ */
+class ColumnVariant final : public COWHelper<IColumn, ColumnVariant>
+{
+public:
+ using Discriminator = UInt8;
+ using Discriminators = PaddedPODArray<Discriminator>;
+ using ColumnDiscriminators = ColumnVector<Discriminator>;
+ using ColumnOffsets = ColumnVector<Offset>;
+
+ static constexpr UInt8 NULL_DISCRIMINATOR = std::numeric_limits<Discriminator>::max(); /// 255
+ static constexpr size_t MAX_NESTED_COLUMNS = std::numeric_limits<Discriminator>::max(); /// 255
+
+private:
+ friend class COWHelper<IColumn, ColumnVariant>;
+
+ using NestedColumns = std::vector<WrappedPtr>;
+
+ /// Create an empty column with provided variants.
+ /// Variants are in global order.
+ explicit ColumnVariant(MutableColumns && variants_);
+ /// Variants are in local order according to provided mapping.
+ explicit ColumnVariant(MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+
+ /// Create column from discriminators column and list of variant columns.
+ /// Offsets column should be constructed according to the discriminators.
+ /// Variants are in global order.
+ ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_);
+ /// Variants are in local order according to provided mapping.
+ ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+
+ /// Create column from discriminators column, offsets column and list of variant columns.
+ /// Variants are in global order.
+ ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_);
+ /// Variants are in local order according to provided mapping.
+ ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+
+ ColumnVariant(const ColumnVariant &) = default;
+
+public:
+ /** Create immutable column using immutable arguments. These arguments may be shared with other variants.
+ * Use IColumn::mutate in order to make mutable column and mutate shared nested variants.
+ */
+ using Base = COWHelper<IColumn, ColumnVariant>;
+ static Ptr create(const Columns & variants_) { return create(variants_, {}); }
+ static Ptr create(const Columns & variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+ static Ptr create(const ColumnPtr & local_discriminators_, const Columns & variants_) { return create(local_discriminators_, variants_, {}); }
+ static Ptr create(const ColumnPtr & local_discriminators_, const Columns & variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+ static Ptr create(const ColumnPtr & local_discriminators_, const DB::ColumnPtr & offsets_, const Columns & variants_) { return create(local_discriminators_, offsets_, variants_, {}); }
+ static Ptr create(const ColumnPtr & local_discriminators_, const DB::ColumnPtr & offsets_, const Columns & variants_, const std::vector<Discriminator> & local_to_global_discriminators_);
+
+ static MutablePtr create(MutableColumns && variants_)
+ {
+ return Base::create(std::move(variants_));
+ }
+
+ static MutablePtr create(MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_)
+ {
+ return Base::create(std::move(variants_), local_to_global_discriminators_);
+ }
+
+ static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumns && variants_)
+ {
+ return Base::create(std::move(local_discriminators_), std::move(variants_));
+ }
+
+ static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_)
+ {
+ return Base::create(std::move(local_discriminators_), std::move(variants_), local_to_global_discriminators_);
+ }
+
+ static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_)
+ {
+ return Base::create(std::move(local_discriminators_), std::move(offsets_), std::move(variants_));
+ }
+
+ static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_, const std::vector<Discriminator> & local_to_global_discriminators_)
+ {
+ return Base::create(std::move(local_discriminators_), std::move(offsets_), std::move(variants_), local_to_global_discriminators_);
+ }
+
+ std::string getName() const override;
+ const char * getFamilyName() const override { return "Variant"; }
+ TypeIndex getDataType() const override { return TypeIndex::Variant; }
+
+ MutableColumnPtr cloneEmpty() const override;
+ 
MutableColumnPtr cloneResized(size_t size) const override;
+
+ size_t ALWAYS_INLINE offsetAt(size_t i) const { return getOffsets()[i]; }
+ Discriminator ALWAYS_INLINE localDiscriminatorAt(size_t i) const { return getLocalDiscriminators()[i]; }
+ Discriminator ALWAYS_INLINE globalDiscriminatorAt(size_t i) const { return globalDiscriminatorByLocal(getLocalDiscriminators()[i]); }
+
+ Discriminator ALWAYS_INLINE globalDiscriminatorByLocal(Discriminator local_discr) const
+ {
+ /// NULL_DISCRIMINATOR is always the same in local and global orders.
+ return local_discr == NULL_DISCRIMINATOR ? NULL_DISCRIMINATOR : local_to_global_discriminators[local_discr];
+ }
+
+ Discriminator ALWAYS_INLINE localDiscriminatorByGlobal(Discriminator global_discr) const
+ {
+ /// NULL_DISCRIMINATOR is always the same in local and global orders.
+ return global_discr == NULL_DISCRIMINATOR ? NULL_DISCRIMINATOR : global_to_local_discriminators[global_discr];
+ }
+
+ size_t size() const override
+ {
+ return local_discriminators->size();
+ }
+
+ Field operator[](size_t n) const override;
+ void get(size_t n, Field & res) const override;
+
+ bool isDefaultAt(size_t n) const override;
+ bool isNullAt(size_t n) const override;
+ StringRef getDataAt(size_t n) const override;
+ void insertData(const char * pos, size_t length) override;
+ void insert(const Field & x) override;
+ void insertFrom(const IColumn & src_, size_t n) override;
+ void insertRangeFrom(const IColumn & src, size_t start, size_t length) override;
+ void insertManyFrom(const IColumn & src, size_t position, size_t length) override;
+ void insertDefault() override;
+ void insertManyDefaults(size_t length) override;
+ void popBack(size_t n) override;
+ StringRef serializeValueIntoArena(size_t n, Arena & arena, char const *& begin, const UInt8 *) const override;
+ const char * deserializeAndInsertFromArena(const char * pos) override;
+ const char * skipSerializedInArena(const char * pos) const override;
+ void updateHashWithValue(size_t n, SipHash & hash) const override;
+ void updateWeakHash32(WeakHash32 & hash) const override;
+ void updateHashFast(SipHash & hash) const override;
+ ColumnPtr filter(const Filter & filt, ssize_t result_size_hint) const override;
+ void expand(const Filter & mask, bool inverted) override;
+ ColumnPtr permute(const Permutation & perm, size_t limit) const override;
+ ColumnPtr index(const IColumn & indexes, size_t limit) const override;
+ template <typename Type>
+ ColumnPtr indexImpl(const PaddedPODArray<Type> & indexes, size_t limit) const;
+ ColumnPtr replicate(const Offsets & replicate_offsets) const override;
+ MutableColumns scatter(ColumnIndex num_columns, const Selector & selector) const override;
+ void gather(ColumnGathererStream & gatherer_stream) override;
+
+ /// Variant type is not comparable.
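+ /// compareAt deliberately reports all rows as equal; getPermutation correspondingly
+ /// degenerates to the identity permutation.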
+ int compareAt(size_t, size_t, const IColumn &, int) const override
+ {
+ return 0;
+ }
+
+ void compareColumn(const IColumn &, size_t, PaddedPODArray<UInt64> *, PaddedPODArray<Int8> &, int, int) const override
+ {
+ throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnVariant");
+ }
+
+ bool hasEqualValues() const override;
+ void getExtremes(Field & min, Field & max) const override;
+ void getPermutation(IColumn::PermutationSortDirection direction, IColumn::PermutationSortStability stability,
+ size_t limit, int nan_direction_hint, IColumn::Permutation & res) const override;
+ void updatePermutation(IColumn::PermutationSortDirection direction, IColumn::PermutationSortStability stability,
+ size_t limit, int nan_direction_hint, IColumn::Permutation & res, EqualRanges & equal_ranges) const override;
+
+ void reserve(size_t n) override;
+ void ensureOwnership() override;
+ size_t byteSize() const override;
+ size_t byteSizeAt(size_t n) const override;
+ size_t allocatedBytes() const override;
+ void protect() override;
+ void forEachSubcolumn(MutableColumnCallback callback) override;
+ void forEachSubcolumnRecursively(RecursiveMutableColumnCallback callback) override;
+ bool structureEquals(const IColumn & rhs) const override;
+ ColumnPtr compress() const override;
+ double getRatioOfDefaultRows(double sample_ratio) const override;
+ UInt64 getNumberOfDefaultRows() const override;
+ void getIndicesOfNonDefaultRows(Offsets & indices, size_t from, size_t limit) const override;
+ void finalize() override;
+ bool isFinalized() const override;
+
+ const IColumn & getVariantByLocalDiscriminator(size_t discr) const { return *variants[discr]; }
+ const IColumn & getVariantByGlobalDiscriminator(size_t discr) const { return *variants[global_to_local_discriminators.at(discr)]; }
+ IColumn & getVariantByLocalDiscriminator(size_t discr) { return *variants[discr]; }
+ IColumn & getVariantByGlobalDiscriminator(size_t discr) { return *variants[global_to_local_discriminators.at(discr)]; }
+
+ const ColumnPtr & getVariantPtrByLocalDiscriminator(size_t discr) const { return variants[discr]; }
+ const ColumnPtr & getVariantPtrByGlobalDiscriminator(size_t discr) const { return variants[global_to_local_discriminators.at(discr)]; }
+ ColumnPtr & getVariantPtrByLocalDiscriminator(size_t discr) { return variants[discr]; }
+ ColumnPtr & getVariantPtrByGlobalDiscriminator(size_t discr) { return variants[global_to_local_discriminators.at(discr)]; }
+
+ const IColumn & getLocalDiscriminatorsColumn() const { return *local_discriminators; }
+ IColumn & getLocalDiscriminatorsColumn() { return *local_discriminators; }
+
+ const ColumnPtr & getLocalDiscriminatorsPtr() const { return local_discriminators; }
+ ColumnPtr & getLocalDiscriminatorsPtr() { return local_discriminators; }
+
+ const Discriminators & ALWAYS_INLINE getLocalDiscriminators() const { return assert_cast<const ColumnDiscriminators &>(*local_discriminators).getData(); }
+ Discriminators & ALWAYS_INLINE getLocalDiscriminators() { return assert_cast<ColumnDiscriminators &>(*local_discriminators).getData(); }
+
+ const IColumn & getOffsetsColumn() const { return *offsets; }
+ IColumn & getOffsetsColumn() { return *offsets; }
+
+ const ColumnPtr & getOffsetsPtr() const { return offsets; }
+ ColumnPtr & getOffsetsPtr() { return offsets; }
+
+ const Offsets & ALWAYS_INLINE getOffsets() const { return assert_cast<const ColumnOffsets &>(*offsets).getData(); }
+ Offsets & ALWAYS_INLINE getOffsets() { return assert_cast<ColumnOffsets &>(*offsets).getData(); }
+
+ size_t getNumVariants() const { return variants.size(); }
+
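+ /// A typical read of row n through the global-discriminator API (an illustrative sketch):
+ ///
+ /// Discriminator global_discr = column.globalDiscriminatorAt(n);
+ /// if (global_discr != ColumnVariant::NULL_DISCRIMINATOR)
+ /// Field value = column.getVariantByGlobalDiscriminator(global_discr)[column.offsetAt(n)];
+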
+ bool hasOnlyNulls() const + { + /// If all variants are empty, we have only NULL values. + return std::all_of(variants.begin(), variants.end(), [](const auto & v){ return v->empty(); } ); + } + + /// Check if local and global order is the same. + bool hasGlobalVariantsOrder() const + { + for (size_t i = 0; i != local_to_global_discriminators.size(); ++i) + { + if (local_to_global_discriminators[i] != i) + return false; + } + + return true; + } + + /// Check if we have only 1 non-empty variant and no NULL values, + /// and if so, return the discriminator of this non-empty column. + std::optional getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls() const; + + /// Apply null map to a Variant column. + /// Replace corresponding discriminators with NULL_DISCRIMINATOR + /// and filter out rows in variants if needed. + void applyNullMap(const ColumnVector::Container & null_map); + void applyNegatedNullMap(const ColumnVector::Container & null_map); + +private: + void initIdentityGlobalToLocalDiscriminatorsMapping(); + + template + void applyNullMapImpl(const ColumnVector::Container & null_map); + + WrappedPtr local_discriminators; + WrappedPtr offsets; + NestedColumns variants; + + std::vector global_to_local_discriminators; + std::vector local_to_global_discriminators; +}; + + +} diff --git a/src/Columns/IColumn.cpp b/src/Columns/IColumn.cpp index 7923bca6354..82dc82e0bd9 100644 --- a/src/Columns/IColumn.cpp +++ b/src/Columns/IColumn.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include #include @@ -83,6 +84,11 @@ bool isColumnNullable(const IColumn & column) return checkColumn(column); } +bool isColumnNullableOrLowCardinalityNullable(const IColumn & column) +{ + return isColumnNullable(column) || isColumnLowCardinalityNullable(column); +} + bool isColumnConst(const IColumn & column) { return checkColumn(column); diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index f012eeca61f..0dcba5b310c 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -631,6 +631,17 @@ struct IsMutableColumns template <> struct IsMutableColumns<> { static const bool value = true; }; +template +struct IsMutableColumnsOrRvalueReferences; + +template +struct IsMutableColumnsOrRvalueReferences +{ + static const bool value = (std::is_assignable::value || std::is_rvalue_reference_v) && IsMutableColumnsOrRvalueReferences::value; +}; + +template <> +struct IsMutableColumnsOrRvalueReferences<> { static const bool value = true; }; template const Type * checkAndGetColumn(const IColumn & column) @@ -662,4 +673,7 @@ bool isColumnConst(const IColumn & column); /// True if column's an ColumnNullable instance. It's just a syntax sugar for type check. bool isColumnNullable(const IColumn & column); +/// True if column's is ColumnNullable or ColumnLowCardinality with nullable nested column. 
+bool isColumnNullableOrLowCardinalityNullable(const IColumn & column); + } diff --git a/src/Columns/MaskOperations.cpp b/src/Columns/MaskOperations.cpp index b84268356a7..518269e1728 100644 --- a/src/Columns/MaskOperations.cpp +++ b/src/Columns/MaskOperations.cpp @@ -17,7 +17,7 @@ namespace ErrorCodes } template -void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted) +void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted, T default_value) { if (mask.size() < data.size()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Mask size should be no less than data size."); @@ -38,7 +38,7 @@ void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & ma --from; } else - data[index] = T(); + data[index] = default_value; --index; } @@ -49,7 +49,7 @@ void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & ma /// Explicit instantiations - not to place the implementation of the function above in the header file. #define INSTANTIATE(TYPE) \ -template void expandDataByMask(PaddedPODArray &, const PaddedPODArray &, bool); +template void expandDataByMask(PaddedPODArray &, const PaddedPODArray &, bool, TYPE); INSTANTIATE(UInt8) INSTANTIATE(UInt16) diff --git a/src/Columns/MaskOperations.h b/src/Columns/MaskOperations.h index e43b4588258..cc5226bf0c1 100644 --- a/src/Columns/MaskOperations.h +++ b/src/Columns/MaskOperations.h @@ -13,7 +13,7 @@ namespace DB /// If inverted is true, we will work with inverted mask. This function is used in implementations of /// expand() method in IColumn interface. template -void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted); +void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted, T default_value = T()); struct MaskInfo { diff --git a/src/Columns/tests/gtest_column_variant.cpp b/src/Columns/tests/gtest_column_variant.cpp new file mode 100644 index 00000000000..b701e2d3183 --- /dev/null +++ b/src/Columns/tests/gtest_column_variant.cpp @@ -0,0 +1,688 @@ +#include +#include +#include +#include +#include + +using namespace DB; + +TEST(ColumnVariant, CreateFromEmptyColumns) +{ + MutableColumns columns; + columns.push_back(ColumnUInt32::create()); + columns.push_back(ColumnString::create()); + auto column = ColumnVariant::create(std::move(columns)); + ASSERT_TRUE(column->empty() && column->getLocalDiscriminators().empty() && column->getOffsets().empty()); +} + +TEST(ColumnVariant, CreateFromEmptyColumnsWithLocalOrder) +{ + MutableColumns columns; + columns.push_back(ColumnUInt32::create()); + columns.push_back(ColumnString::create()); + std::vector local_to_global_discriminators; + local_to_global_discriminators.push_back(1); + local_to_global_discriminators.push_back(0); + auto column = ColumnVariant::create(std::move(columns), local_to_global_discriminators); + ASSERT_TRUE(column->empty() && column->getLocalDiscriminators().empty() && column->getOffsets().empty()); + ASSERT_EQ(column->localDiscriminatorByGlobal(0), 0); + ASSERT_EQ(column->localDiscriminatorByGlobal(1), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(0), 0); + ASSERT_EQ(column->globalDiscriminatorByLocal(1), 1); +} + +MutableColumns createColumns1() +{ + MutableColumns columns; + auto column1 = ColumnUInt64::create(); + column1->insertValue(42); + columns.push_back(std::move(column1)); + auto column2 = ColumnString::create(); + column2->insertData("Hello", 5); + column2->insertData("World", 5); + columns.push_back(std::move(column2)); + auto column3 = 
ColumnUInt32::create(); + columns.push_back(std::move(column3)); + return columns; +} + +MutableColumnPtr createDiscriminators1() +{ + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + return discriminators_column; +} + +void reorderColumns(const std::vector & local_to_global_order, MutableColumns & columns) +{ + MutableColumns res; + for (auto global_discr : local_to_global_order) + res.push_back(std::move(columns[global_discr])); + columns = std::move(res); +} + +template +void reorderDiscriminators(const std::vector & local_to_global_order, Ptr & discriminators) +{ + std::vector global_to_local_order(local_to_global_order.size()); + for (size_t i = 0; i != local_to_global_order.size(); ++i) + global_to_local_order[local_to_global_order[i]] = i; + + auto & discriminators_data = assert_cast(discriminators.get())->getData(); + for (auto & discr : discriminators_data) + { + if (discr != ColumnVariant::NULL_DISCRIMINATOR) + discr = global_to_local_order[discr]; + } +} + +MutableColumnPtr createOffsets1() +{ + auto offsets = ColumnVariant::ColumnOffsets::create(); + offsets->insertValue(0); + offsets->insertValue(0); + offsets->insertValue(0); + offsets->insertValue(1); + offsets->insertValue(0); + return offsets; +} + +std::vector createLocalToGlobalOrder1() +{ + std::vector local_to_global_discriminators; + local_to_global_discriminators.push_back(1); + local_to_global_discriminators.push_back(2); + local_to_global_discriminators.push_back(0); + return local_to_global_discriminators; +} + +void checkColumnVariant1(ColumnVariant * column) +{ + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 5); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 0); + ASSERT_EQ(offsets[3], 1); + ASSERT_TRUE(column->isDefaultAt(2) && column->isDefaultAt(4)); + ASSERT_EQ((*column)[0].get(), 42); + ASSERT_EQ((*column)[1].get(), "Hello"); + ASSERT_TRUE((*column)[2].isNull()); + ASSERT_EQ((*column)[3].get(), "World"); + ASSERT_TRUE((*column)[4].isNull()); +} + +void checkColumnVariant1Order(ColumnVariant * column) +{ + ASSERT_EQ(column->localDiscriminatorByGlobal(0), 2); + ASSERT_EQ(column->localDiscriminatorByGlobal(1), 0); + ASSERT_EQ(column->localDiscriminatorByGlobal(2), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(0), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(1), 2); + ASSERT_EQ(column->globalDiscriminatorByLocal(2), 0); + ASSERT_EQ(column->localDiscriminatorAt(0), 2); + ASSERT_EQ(column->localDiscriminatorAt(1), 0); + ASSERT_EQ(column->localDiscriminatorAt(2), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->localDiscriminatorAt(3), 0); + ASSERT_EQ(column->localDiscriminatorAt(4), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->globalDiscriminatorAt(0), 0); + ASSERT_EQ(column->globalDiscriminatorAt(1), 1); + ASSERT_EQ(column->globalDiscriminatorAt(2), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->globalDiscriminatorAt(3), 1); + ASSERT_EQ(column->globalDiscriminatorAt(4), ColumnVariant::NULL_DISCRIMINATOR); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndColumns) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(columns)); + 
checkColumnVariant1(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndColumnsWithLocalOrder) +{ + auto local_to_global_order = createLocalToGlobalOrder1(); + auto columns = createColumns1(); + reorderColumns(local_to_global_order, columns); + auto discriminators = createDiscriminators1(); + reorderDiscriminators(local_to_global_order, discriminators); + auto column = ColumnVariant::create(std::move(discriminators), std::move(columns), createLocalToGlobalOrder1()); + checkColumnVariant1(column.get()); + checkColumnVariant1Order(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsOffsetsAndColumns) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + auto offsets = createOffsets1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(offsets), std::move(columns)); + checkColumnVariant1(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsOffsetsAndColumnsWithLocalOrder) +{ + auto local_to_global_order = createLocalToGlobalOrder1(); + auto columns = createColumns1(); + reorderColumns(local_to_global_order, columns); + auto discriminators = createDiscriminators1(); + reorderDiscriminators(local_to_global_order, discriminators); + auto offsets = createOffsets1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(offsets), std::move(columns), createLocalToGlobalOrder1()); + checkColumnVariant1(column.get()); + checkColumnVariant1Order(column.get()); +} + +ColumnVariant::MutablePtr createVariantWithOneFullColumNoNulls(size_t size, bool change_order) +{ + MutableColumns columns; + auto column1 = ColumnUInt64::create(); + for (size_t i = 0; i != size; ++i) + column1->insertValue(i); + columns.push_back(std::move(column1)); + auto column2 = ColumnString::create(); + columns.push_back(std::move(column2)); + auto column3 = ColumnUInt32::create(); + columns.push_back(std::move(column3)); + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + for (size_t i = 0; i != size; ++i) + discriminators_column->insertValue(0); + if (change_order) + { + auto local_to_global_order = createLocalToGlobalOrder1(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators_column); + return ColumnVariant::create(std::move(discriminators_column), std::move(columns), createLocalToGlobalOrder1()); + } + return ColumnVariant::create(std::move(discriminators_column), std::move(columns)); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndOneFullColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 1); + ASSERT_EQ(offsets[2], 2); + ASSERT_EQ((*column)[0].get(), 0); + ASSERT_EQ((*column)[1].get(), 1); + ASSERT_EQ((*column)[2].get(), 2); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndOneFullColumnNoNullsWithLocalOrder) +{ + auto column = createVariantWithOneFullColumNoNulls(3, true); + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 1); + ASSERT_EQ(offsets[2], 2); + ASSERT_EQ((*column)[0].get(), 0); + ASSERT_EQ((*column)[1].get(), 1); + ASSERT_EQ((*column)[2].get(), 2); + ASSERT_EQ(column->localDiscriminatorAt(0), 2); + ASSERT_EQ(column->localDiscriminatorAt(1), 2); + ASSERT_EQ(column->localDiscriminatorAt(2), 2); + ASSERT_EQ(column->globalDiscriminatorAt(0), 0); + 
ASSERT_EQ(column->globalDiscriminatorAt(1), 0);
+ ASSERT_EQ(column->globalDiscriminatorAt(2), 0);
+}
+
+TEST(ColumnVariant, CloneResizedToEmpty)
+{
+ auto column = ColumnVariant::create(createDiscriminators1(), createOffsets1(), createColumns1());
+ auto resized_column = column->cloneResized(0);
+ ASSERT_TRUE(resized_column->empty());
+}
+
+TEST(ColumnVariant, CloneResizedToLarge)
+{
+ auto column = ColumnVariant::create(createDiscriminators1(), createOffsets1(), createColumns1());
+ auto resized_column = column->cloneResized(7);
+ const auto * resized_column_variant = assert_cast<const ColumnVariant *>(resized_column.get());
+ ASSERT_EQ(resized_column_variant->size(), 7);
+ const auto & offsets = resized_column_variant->getOffsets();
+ for (size_t i = 0; i != 7; ++i)
+ {
+ if (i == 3)
+ ASSERT_EQ(offsets[i], 1);
+ else
+ ASSERT_EQ(offsets[i], 0);
+ }
+
+ const auto & discriminators = resized_column_variant->getLocalDiscriminators();
+ std::vector<size_t> null_indexes = {2, 4, 5, 6};
+ for (size_t i : null_indexes)
+ ASSERT_EQ(discriminators[i], ColumnVariant::NULL_DISCRIMINATOR);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 1);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 2);
+}
+
+TEST(ColumnVariant, CloneResizedWithOneFullColumnNoNulls)
+{
+ auto column = createVariantWithOneFullColumNoNulls(5, false);
+ auto resized_column = column->cloneResized(3);
+ const auto * resized_column_variant = assert_cast<const ColumnVariant *>(resized_column.get());
+ ASSERT_EQ(resized_column_variant->size(), 3);
+ const auto & offsets = resized_column_variant->getOffsets();
+ for (size_t i = 0; i != 3; ++i)
+ ASSERT_EQ(offsets[i], i);
+ const auto & discriminators = resized_column_variant->getLocalDiscriminators();
+ for (size_t i = 0; i != 3; ++i)
+ ASSERT_EQ(discriminators[i], 0);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 3);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 0);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0);
+}
+
+MutableColumns createColumns2()
+{
+ MutableColumns columns;
+ auto column1 = ColumnUInt64::create();
+ column1->insertValue(42);
+ column1->insertValue(43);
+ column1->insertValue(44);
+ columns.push_back(std::move(column1));
+ auto column2 = ColumnString::create();
+ column2->insertData("Hello", 5);
+ column2->insertData("World", 5);
+ columns.push_back(std::move(column2));
+ auto column3 = ColumnUInt8::create();
+ columns.push_back(std::move(column3));
+ return columns;
+}
+
+TEST(ColumnVariant, CloneResizedGeneral1)
+{
+ /// D      c1    c2      c3
+ /// 0      42    Hello
+ /// 1      43    World
+ /// NULL   44
+ /// 0
+ /// 1
+ /// NULL
+ /// 0
+ auto discriminators_column = ColumnVariant::ColumnDiscriminators::create();
+ discriminators_column->insertValue(0);
+ discriminators_column->insertValue(1);
+ discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR);
+ discriminators_column->insertValue(0);
+ discriminators_column->insertValue(1);
+ discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR);
+ discriminators_column->insertValue(0);
+ auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2());
+ auto resized_column = column->cloneResized(4);
+ const auto * resized_column_variant = assert_cast<const ColumnVariant *>(resized_column.get());
+ ASSERT_EQ(resized_column_variant->size(), 4);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 2);
+ ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 1);
+ 
ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], 1); + ASSERT_EQ(discriminators[2], ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(discriminators[3], 0); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 0); + ASSERT_EQ(offsets[3], 1); + ASSERT_EQ((*resized_column_variant)[0].get(), 42); + ASSERT_EQ((*resized_column_variant)[1].get(), "Hello"); + ASSERT_EQ((*resized_column_variant)[3].get(), 43); +} + +TEST(ColumnVariant, CloneResizedGeneral2) +{ + /// D c1 c2 c3 + /// 0 42 Hello + /// NULL 43 World + /// NULL 44 + /// 0 + /// 1 + /// 1 + /// 0 + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(1); + discriminators_column->insertValue(0); + auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2()); + auto resized_column = column->cloneResized(3); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 3); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 1); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 0); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(discriminators[2], ColumnVariant::NULL_DISCRIMINATOR); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ((*resized_column_variant)[0].get(), 42); +} + +TEST(ColumnVariant, CloneResizedGeneral3) +{ + /// D c1 c2 c3 + /// 0 42 Hello + /// 1 43 World + /// 1 44 + /// 0 + /// NULL + /// NULL + /// 0 + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(1); + discriminators_column->insertValue(0); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2()); + auto resized_column = column->cloneResized(5); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 5); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 2); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 2); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], 1); + ASSERT_EQ(discriminators[2], 1); + ASSERT_EQ(discriminators[3], 0); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 
0); + ASSERT_EQ(offsets[2], 1); + ASSERT_EQ(offsets[3], 1); + ASSERT_EQ((*resized_column_variant)[0].get<UInt64>(), 42); + ASSERT_EQ((*resized_column_variant)[1].get<String>(), "Hello"); + ASSERT_EQ((*resized_column_variant)[2].get<String>(), "World"); + ASSERT_EQ((*resized_column_variant)[3].get<UInt64>(), 43); +} + +MutableColumnPtr createDiscriminators2() +{ + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + return discriminators_column; +} + +std::vector<ColumnVariant::Discriminator> createLocalToGlobalOrder2() +{ + std::vector<ColumnVariant::Discriminator> local_to_global_discriminators; + local_to_global_discriminators.push_back(2); + local_to_global_discriminators.push_back(0); + local_to_global_discriminators.push_back(1); + return local_to_global_discriminators; +} + +ColumnVariant::MutablePtr createVariantColumn1(bool reorder) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + if (!reorder) + return ColumnVariant::create(std::move(discriminators), std::move(columns)); + auto local_to_global_order = createLocalToGlobalOrder1(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators); + return ColumnVariant::create(std::move(discriminators), std::move(columns), local_to_global_order); +} + +ColumnVariant::MutablePtr createVariantColumn2(bool reorder) +{ + auto columns = createColumns2(); + auto discriminators = createDiscriminators2(); + if (!reorder) + return ColumnVariant::create(std::move(discriminators), std::move(columns)); + auto local_to_global_order = createLocalToGlobalOrder2(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators); + return ColumnVariant::create(std::move(discriminators), std::move(columns), local_to_global_order); +} + +TEST(ColumnVariant, InsertFrom) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertFrom(*column_from, 3); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 0); + ASSERT_EQ((*column_to)[5].get<UInt64>(), 43); + } +} + +TEST(ColumnVariant, InsertRangeFromOneColumnNoNulls) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn2(change_order); + auto column_from = createVariantWithOneFullColumNoNulls(5, change_order); + column_to->insertRangeFrom(*column_from, 2, 2); + ASSERT_EQ(column_to->globalDiscriminatorAt(7), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(8), 0); + ASSERT_EQ((*column_to)[7].get<UInt64>(), 2); + ASSERT_EQ((*column_to)[8].get<UInt64>(), 3); + } +} + +TEST(ColumnVariant, InsertRangeFromGeneral) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertRangeFrom(*column_from, 1, 4); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 1); + ASSERT_EQ(column_to->globalDiscriminatorAt(6), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column_to->globalDiscriminatorAt(7), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(8), 1); + ASSERT_EQ((*column_to)[5].get<String>(), "Hello"); + ASSERT_EQ((*column_to)[7].get<UInt64>(), 43); +
ASSERT_EQ((*column_to)[8].get<String>(), "World"); + } +} + +TEST(ColumnVariant, InsertManyFrom) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertManyFrom(*column_from, 3, 2); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(6), 0); + ASSERT_EQ((*column_to)[5].get<UInt64>(), 43); + ASSERT_EQ((*column_to)[6].get<UInt64>(), 43); + } +} + +TEST(ColumnVariant, PopBackOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(5, false); + column->popBack(3); + ASSERT_EQ(column->size(), 2); + ASSERT_EQ(column->getVariantByLocalDiscriminator(0).size(), 2); + ASSERT_EQ((*column)[0].get<UInt64>(), 0); + ASSERT_EQ((*column)[1].get<UInt64>(), 1); +} + +TEST(ColumnVariant, PopBackGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + column->popBack(4); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(column->getVariantByLocalDiscriminator(0).size(), 1); + ASSERT_EQ(column->getVariantByLocalDiscriminator(1).size(), 1); + ASSERT_EQ((*column)[0].get<UInt64>(), 42); + ASSERT_EQ((*column)[1].get<String>(), "Hello"); + ASSERT_TRUE((*column)[2].isNull()); +} + +TEST(ColumnVariant, FilterOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + IColumn::Filter filter; + filter.push_back(1); + filter.push_back(0); + filter.push_back(1); + auto filtered_column = column->filter(filter, -1); + ASSERT_EQ(filtered_column->size(), 2); + ASSERT_EQ((*filtered_column)[0].get<UInt64>(), 0); + ASSERT_EQ((*filtered_column)[1].get<UInt64>(), 2); +} + +TEST(ColumnVariant, FilterGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Filter filter; + filter.push_back(0); + filter.push_back(1); + filter.push_back(1); + filter.push_back(0); + filter.push_back(0); + filter.push_back(1); + filter.push_back(0); + auto filtered_column = column->filter(filter, -1); + ASSERT_EQ(filtered_column->size(), 3); + ASSERT_EQ((*filtered_column)[0].get<String>(), "Hello"); + ASSERT_TRUE((*filtered_column)[1].isNull()); + ASSERT_TRUE((*filtered_column)[2].isNull()); +} + +TEST(ColumnVariant, PermuteAndIndexOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(4, false); + IColumn::Permutation permutation; + permutation.push_back(1); + permutation.push_back(3); + permutation.push_back(2); + permutation.push_back(0); + auto permuted_column = column->permute(permutation, 3); + ASSERT_EQ(permuted_column->size(), 3); + ASSERT_EQ((*permuted_column)[0].get<UInt64>(), 1); + ASSERT_EQ((*permuted_column)[1].get<UInt64>(), 3); + ASSERT_EQ((*permuted_column)[2].get<UInt64>(), 2); + + auto index = ColumnUInt64::create(); + index->getData() = std::move(permutation); + auto indexed_column = column->index(*index, 3); + ASSERT_EQ(indexed_column->size(), 3); + ASSERT_EQ((*indexed_column)[0].get<UInt64>(), 1); + ASSERT_EQ((*indexed_column)[1].get<UInt64>(), 3); + ASSERT_EQ((*indexed_column)[2].get<UInt64>(), 2); +} + +TEST(ColumnVariant, PermuteGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Permutation permutation; + permutation.push_back(3); + permutation.push_back(4); + permutation.push_back(1); + permutation.push_back(5); + auto permuted_column = column->permute(permutation, 4); + ASSERT_EQ(permuted_column->size(), 4); + ASSERT_EQ((*permuted_column)[0].get<UInt64>(), 43); + ASSERT_EQ((*permuted_column)[1].get<String>(), "World"); + ASSERT_EQ((*permuted_column)[2].get<String>(), "Hello"); +
ASSERT_TRUE((*permuted_column)[3].isNull()); +} + +TEST(ColumnVariant, ReplicateOneColumnNoNull) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + IColumn::Offsets offsets; + offsets.push_back(0); + offsets.push_back(3); + offsets.push_back(6); + auto replicated_column = column->replicate(offsets); + ASSERT_EQ(replicated_column->size(), 6); + ASSERT_EQ((*replicated_column)[0].get<UInt64>(), 1); + ASSERT_EQ((*replicated_column)[1].get<UInt64>(), 1); + ASSERT_EQ((*replicated_column)[2].get<UInt64>(), 1); + ASSERT_EQ((*replicated_column)[3].get<UInt64>(), 2); + ASSERT_EQ((*replicated_column)[4].get<UInt64>(), 2); + ASSERT_EQ((*replicated_column)[5].get<UInt64>(), 2); +} + +TEST(ColumnVariant, ReplicateGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators1(), createColumns1()); + IColumn::Offsets offsets; + offsets.push_back(1); + offsets.push_back(3); + offsets.push_back(5); + offsets.push_back(5); + offsets.push_back(7); + auto replicated_column = column->replicate(offsets); + ASSERT_EQ(replicated_column->size(), 7); + ASSERT_EQ((*replicated_column)[0].get<UInt64>(), 42); + ASSERT_EQ((*replicated_column)[1].get<String>(), "Hello"); + ASSERT_EQ((*replicated_column)[2].get<String>(), "Hello"); + ASSERT_TRUE((*replicated_column)[3].isNull()); + ASSERT_TRUE((*replicated_column)[4].isNull()); + ASSERT_TRUE((*replicated_column)[5].isNull()); + ASSERT_TRUE((*replicated_column)[6].isNull()); +} + +TEST(ColumnVariant, ScatterOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(5, false); + IColumn::Selector selector; + selector.push_back(0); + selector.push_back(1); + selector.push_back(2); + selector.push_back(0); + selector.push_back(1); + auto columns = column->scatter(3, selector); + ASSERT_EQ(columns[0]->size(), 2); + ASSERT_EQ((*columns[0])[0].get<UInt64>(), 0); + ASSERT_EQ((*columns[0])[1].get<UInt64>(), 3); + ASSERT_EQ(columns[1]->size(), 2); + ASSERT_EQ((*columns[1])[0].get<UInt64>(), 1); + ASSERT_EQ((*columns[1])[1].get<UInt64>(), 4); + ASSERT_EQ(columns[2]->size(), 1); + ASSERT_EQ((*columns[2])[0].get<UInt64>(), 2); +} + +TEST(ColumnVariant, ScatterGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Selector selector; + selector.push_back(0); + selector.push_back(0); + selector.push_back(2); + selector.push_back(0); + selector.push_back(1); + selector.push_back(2); + selector.push_back(1); + auto columns = column->scatter(3, selector); + ASSERT_EQ(columns[0]->size(), 3); + ASSERT_EQ((*columns[0])[0].get<UInt64>(), 42); + ASSERT_EQ((*columns[0])[1].get<String>(), "Hello"); + ASSERT_EQ((*columns[0])[2].get<UInt64>(), 43); + ASSERT_EQ(columns[1]->size(), 2); + ASSERT_EQ((*columns[1])[0].get<String>(), "World"); + ASSERT_EQ((*columns[1])[1].get<UInt64>(), 44); + ASSERT_EQ(columns[2]->size(), 2); + ASSERT_TRUE((*columns[2])[0].isNull()); + ASSERT_TRUE((*columns[2])[1].isNull()); +} diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 7e50a81ada8..0151dcb982d 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -816,6 +816,7 @@ class IColumn; M(Bool, function_json_value_return_type_allow_complex, false, "Allow function JSON_VALUE to return complex type, such as: struct, array, map.", 0) \ M(Bool, use_with_fill_by_sorting_prefix, true, "Columns preceding WITH FILL columns in ORDER BY clause form sorting prefix.
Rows with different values in sorting prefix are filled independently", 0) \ M(Bool, optimize_uniq_to_count, true, "Rewrite uniq and its variants(except uniqUpTo) to count if subquery has distinct or group by clause.", 0) \ + M(Bool, use_variant_when_no_common_type_in_if, false, "Use Variant as a result type for if/multiIf in case when there is no common type for arguments", 0) \ \ /** Experimental functions */ \ M(Bool, allow_experimental_materialized_postgresql_table, false, "Allows to use the MaterializedPostgreSQL table engine. Disabled by default, because this feature is experimental", 0) \ @@ -823,6 +824,7 @@ class IColumn; M(Bool, allow_experimental_nlp_functions, false, "Enable experimental functions for natural language processing.", 0) \ M(Bool, allow_experimental_hash_functions, false, "Enable experimental hash functions", 0) \ M(Bool, allow_experimental_object_type, false, "Allow Object and JSON data types", 0) \ + M(Bool, allow_experimental_variant_type, false, "Allow Variant data type", 0) \ M(Bool, allow_experimental_annoy_index, false, "Allows to use Annoy index. Disabled by default because this feature is experimental", 0) \ M(Bool, allow_experimental_usearch_index, false, "Allows to use USearch index. Disabled by default because this feature is experimental", 0) \ M(UInt64, max_limit_for_ann_queries, 1'000'000, "SELECT queries with LIMIT bigger than this setting cannot use ANN indexes. Helps to prevent memory overflows in ANN search indexes.", 0) \ diff --git a/src/Core/TypeId.h b/src/Core/TypeId.h index 9c634d2321c..7003e880cd5 100644 --- a/src/Core/TypeId.h +++ b/src/Core/TypeId.h @@ -49,6 +49,7 @@ enum class TypeIndex IPv4, IPv6, JSONPaths, + Variant, }; /** diff --git a/src/DataTypes/DataTypeFactory.cpp b/src/DataTypes/DataTypeFactory.cpp index 415f24d8151..d154b386ace 100644 --- a/src/DataTypes/DataTypeFactory.cpp +++ b/src/DataTypes/DataTypeFactory.cpp @@ -290,6 +290,7 @@ DataTypeFactory::DataTypeFactory() registerDataTypeDomainGeo(*this); registerDataTypeMap(*this); registerDataTypeObject(*this); + registerDataTypeVariant(*this); } DataTypeFactory & DataTypeFactory::instance() diff --git a/src/DataTypes/DataTypeFactory.h b/src/DataTypes/DataTypeFactory.h index ba7c1a3d7fe..a2aeb6f3646 100644 --- a/src/DataTypes/DataTypeFactory.h +++ b/src/DataTypes/DataTypeFactory.h @@ -100,5 +100,6 @@ void registerDataTypeDomainBool(DataTypeFactory & factory); void registerDataTypeDomainSimpleAggregateFunction(DataTypeFactory & factory); void registerDataTypeDomainGeo(DataTypeFactory & factory); void registerDataTypeObject(DataTypeFactory & factory); +void registerDataTypeVariant(DataTypeFactory & factory); } diff --git a/src/DataTypes/DataTypeNullable.cpp b/src/DataTypes/DataTypeNullable.cpp index 41a9a1de543..484d779551f 100644 --- a/src/DataTypes/DataTypeNullable.cpp +++ b/src/DataTypes/DataTypeNullable.cpp @@ -114,5 +114,33 @@ DataTypePtr makeNullableOrLowCardinalityNullable(const DataTypePtr & type) return std::make_shared<DataTypeNullable>(type); } +DataTypePtr makeNullableOrLowCardinalityNullableSafe(const DataTypePtr & type) +{ + if (isNullableOrLowCardinalityNullable(type)) + return type; + + if (type->lowCardinality()) + { + const auto & dictionary_type = assert_cast<const DataTypeLowCardinality &>(*type).getDictionaryType(); + return std::make_shared<DataTypeLowCardinality>(makeNullable(dictionary_type)); + } + + return makeNullableSafe(type); +} + +DataTypePtr removeNullableOrLowCardinalityNullable(const DataTypePtr & type) +{ + if (type->isNullable()) + return static_cast<const DataTypeNullable &>(*type).getNestedType(); + + if (type->isLowCardinalityNullable()) + {
+ auto dict_type = removeNullable(static_cast<const DataTypeLowCardinality &>(*type).getDictionaryType()); + return std::make_shared<DataTypeLowCardinality>(dict_type); + } + + return type; +} } diff --git a/src/DataTypes/DataTypeNullable.h b/src/DataTypes/DataTypeNullable.h index 06d46fb15ed..7ad0e1ba5f1 100644 --- a/src/DataTypes/DataTypeNullable.h +++ b/src/DataTypes/DataTypeNullable.h @@ -54,5 +54,8 @@ DataTypePtr makeNullable(const DataTypePtr & type); DataTypePtr makeNullableSafe(const DataTypePtr & type); DataTypePtr removeNullable(const DataTypePtr & type); DataTypePtr makeNullableOrLowCardinalityNullable(const DataTypePtr & type); +DataTypePtr makeNullableOrLowCardinalityNullableSafe(const DataTypePtr & type); +/// Nullable(T) -> T, LowCardinality(Nullable(T)) -> T +DataTypePtr removeNullableOrLowCardinalityNullable(const DataTypePtr & type); } diff --git a/src/DataTypes/DataTypeTuple.cpp b/src/DataTypes/DataTypeTuple.cpp index fd2e5e6a784..df9af203618 100644 --- a/src/DataTypes/DataTypeTuple.cpp +++ b/src/DataTypes/DataTypeTuple.cpp @@ -11,6 +11,7 @@ #include #include #include +#include #include #include #include @@ -172,11 +173,15 @@ MutableColumnPtr DataTypeTuple::createColumn() const MutableColumnPtr DataTypeTuple::createColumn(const ISerialization & serialization) const { + /// If we read Tuple as Variant subcolumn, it may be wrapped to SerializationVariantElement. + /// Here we don't need it, so we drop this wrapper. + const auto * current_serialization = &serialization; + while (const auto * serialization_variant_element = typeid_cast<const SerializationVariantElement *>(current_serialization)) + current_serialization = serialization_variant_element->getNested().get(); + /// If we read subcolumn of nested Tuple, it may be wrapped to SerializationNamed /// several times to allow to reconstruct the substream path name. /// Here we don't need substream path name, so we drop first several wrapper serializations. - - const auto * current_serialization = &serialization; while (const auto * serialization_named = typeid_cast<const SerializationNamed *>(current_serialization)) current_serialization = serialization_named->getNested().get(); diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp new file mode 100644 index 00000000000..77e1c504cf8 --- /dev/null +++ b/src/DataTypes/DataTypeVariant.cpp @@ -0,0 +1,197 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int BAD_ARGUMENTS; + extern const int EMPTY_DATA_PASSED; +} + + +DataTypeVariant::DataTypeVariant(const DataTypes & variants_) +{ + /// Sort nested types by their full names and squash identical types. + std::map<String, DataTypePtr> name_to_type; + for (const auto & type : variants_) + { + /// Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types are not allowed inside Variant type. + if (isNullableOrLowCardinalityNullable(type)) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Nullable/LowCardinality(Nullable) types are not allowed inside Variant type"); + if (type->getTypeId() == TypeIndex::Variant) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Nested Variant types are not allowed"); + /// Don't use Nothing type as a variant.
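+ /// (Nothing can appear here e.g. for a NULL literal; it carries no values, so such a variant is simply skipped.)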
+ if (!isNothing(type)) + name_to_type[type->getName()] = type; + } + + variants.reserve(name_to_type.size()); + for (const auto & [_, type] : name_to_type) + variants.push_back(type); + + if (variants.empty()) + throw Exception(ErrorCodes::EMPTY_DATA_PASSED, "Variant cannot be empty"); + + if (variants.size() > ColumnVariant::MAX_NESTED_COLUMNS) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Variant type with more than {} nested types is not allowed", ColumnVariant::MAX_NESTED_COLUMNS); +} + +std::string DataTypeVariant::doGetName() const +{ + size_t size = variants.size(); + WriteBufferFromOwnString s; + + s << "Variant("; + for (size_t i = 0; i < size; ++i) + { + if (i != 0) + s << ", "; + + s << variants[i]->getName(); + } + s << ")"; + + return s.str(); +} + +std::string DataTypeVariant::doGetPrettyName(size_t indent) const +{ + size_t size = variants.size(); + WriteBufferFromOwnString s; + s << "Variant(\n"; + + for (size_t i = 0; i != size; ++i) + { + if (i != 0) + s << ",\n"; + + s << fourSpaceIndent(indent + 1) << variants[i]->getPrettyName(indent + 1); + } + + s << '\n' << fourSpaceIndent(indent) << ')'; + return s.str(); +} + +MutableColumnPtr DataTypeVariant::createColumn() const +{ + size_t size = variants.size(); + MutableColumns nested_columns; + nested_columns.reserve(size); + for (size_t i = 0; i < size; ++i) + nested_columns.push_back(variants[i]->createColumn()); + + return ColumnVariant::create(std::move(nested_columns)); +} + + +Field DataTypeVariant::getDefault() const +{ + return Null(); +} + +bool DataTypeVariant::equals(const IDataType & rhs) const +{ + if (typeid(rhs) != typeid(*this)) + return false; + + const DataTypeVariant & rhs_variant = static_cast<const DataTypeVariant &>(rhs); + + size_t size = variants.size(); + if (size != rhs_variant.variants.size()) + return false; + + for (size_t i = 0; i < size; ++i) + if (!variants[i]->equals(*rhs_variant.variants[i])) + return false; + + return true; +} + +bool DataTypeVariant::textCanContainOnlyValidUTF8() const +{ + return std::all_of(variants.begin(), variants.end(), [](auto && elem) { return elem->textCanContainOnlyValidUTF8(); }); +} + +bool DataTypeVariant::haveMaximumSizeOfValue() const +{ + return std::all_of(variants.begin(), variants.end(), [](auto && elem) { return elem->haveMaximumSizeOfValue(); }); +} + +bool DataTypeVariant::hasDynamicSubcolumns() const +{ + return std::any_of(variants.begin(), variants.end(), [](auto && elem) { return elem->hasDynamicSubcolumns(); }); +} + +std::optional<ColumnVariant::Discriminator> DataTypeVariant::tryGetVariantDiscriminator(const DataTypePtr & type) const +{ + String type_name = type->getName(); + for (size_t i = 0; i != variants.size(); ++i) + { + /// We don't use equals here, because it doesn't respect custom type names.
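+ /// (e.g. Bool is UInt8 with a custom name: equals() would consider them identical, while their names differ).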
+ if (variants[i]->getName() == type_name) + return i; + } + + return std::nullopt; +} + +size_t DataTypeVariant::getMaximumSizeOfValueInMemory() const +{ + size_t max_size = 0; + for (const auto & elem : variants) + { + size_t elem_max_size = elem->getMaximumSizeOfValueInMemory(); + if (elem_max_size > max_size) + max_size = elem_max_size; + } + return max_size; +} + +SerializationPtr DataTypeVariant::doGetDefaultSerialization() const +{ + SerializationVariant::VariantSerializations serializations; + serializations.reserve(variants.size()); + Names variant_names; + variant_names.reserve(variants.size()); + + for (const auto & variant : variants) + { + serializations.push_back(variant->getDefaultSerialization()); + variant_names.push_back(variant->getName()); + } + + return std::make_shared<SerializationVariant>(std::move(serializations), std::move(variant_names), SerializationVariant::getVariantsDeserializeTextOrder(variants), getName()); +} + +static DataTypePtr create(const ASTPtr & arguments) +{ + if (!arguments || arguments->children.empty()) + throw Exception(ErrorCodes::EMPTY_DATA_PASSED, "Variant cannot be empty"); + + DataTypes nested_types; + nested_types.reserve(arguments->children.size()); + + for (const ASTPtr & child : arguments->children) + nested_types.emplace_back(DataTypeFactory::instance().get(child)); + + return std::make_shared<DataTypeVariant>(nested_types); +} + + +void registerDataTypeVariant(DataTypeFactory & factory) +{ + factory.registerDataType("Variant", create); +} + +} diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h new file mode 100644 index 00000000000..60113a188b0 --- /dev/null +++ b/src/DataTypes/DataTypeVariant.h @@ -0,0 +1,64 @@ +#pragma once + +#include +#include +#include + + +namespace DB +{ + +/** Variant data type. + * This type represents a union of other data types. + * For example, type Variant(T1, T2, ..., TN) means that each row of this type + * has a value of either type T1 or T2 or ... or TN or none of them (NULL value). + * Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types are not allowed + * inside Variant type. + * The order of nested types doesn't matter: Variant(T1, T2) = Variant(T2, T1). + * To have global order of nested types we sort variants by type names on Variant creation. + * The index of a variant in a sorted list is called global variant discriminator.
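+ * For example, in Variant(UInt64, String) the variants are sorted by name, so String gets global discriminator 0 and UInt64 gets 1; + * rows that hold no value use a separate NULL_DISCRIMINATOR.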
+ */ +class DataTypeVariant final : public IDataType +{ +private: + DataTypes variants; + +public: + static constexpr bool is_parametric = true; + + explicit DataTypeVariant(const DataTypes & variants_); + + TypeIndex getTypeId() const override { return TypeIndex::Variant; } + const char * getFamilyName() const override { return "Variant"; } + + bool canBeInsideNullable() const override { return false; } + bool supportsSparseSerialization() const override { return false; } + bool canBeInsideSparseColumns() const override { return false; } + + MutableColumnPtr createColumn() const override; + + Field getDefault() const override; + + bool equals(const IDataType & rhs) const override; + + bool isParametric() const override { return true; } + bool haveSubtypes() const override { return true; } + bool textCanContainOnlyValidUTF8() const override; + bool haveMaximumSizeOfValue() const override; + bool hasDynamicSubcolumns() const override; + size_t getMaximumSizeOfValueInMemory() const override; + + const DataTypePtr & getVariant(size_t i) const { return variants[i]; } + const DataTypes & getVariants() const { return variants; } + + /// Check if Variant has provided type in the list of variants and return its discriminator. + std::optional<ColumnVariant::Discriminator> tryGetVariantDiscriminator(const DataTypePtr & type) const; + +private: + std::string doGetName() const override; + std::string doGetPrettyName(size_t indent) const override; + SerializationPtr doGetDefaultSerialization() const override; +}; + +} + diff --git a/src/DataTypes/EnumValues.cpp b/src/DataTypes/EnumValues.cpp index 9df49e765a7..8a4b1304d5e 100644 --- a/src/DataTypes/EnumValues.cpp +++ b/src/DataTypes/EnumValues.cpp @@ -74,6 +74,27 @@ T EnumValues<T>::getValue(StringRef field_name, bool try_treat_as_id) const return it->getMapped(); } +template <typename T> +bool EnumValues<T>::tryGetValue(T & x, StringRef field_name, bool try_treat_as_id) const +{ + const auto it = name_to_value_map.find(field_name); + if (!it) + { + /// It is used in CSV and TSV input formats. If we fail to find given string in + /// enum names, we will try to treat it as enum id.
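+ /// (e.g. for Enum8('a' = 1) the input "1" is not a known name, but it parses as the valid id 1).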
+ if (try_treat_as_id) + { + ReadBufferFromMemory tmp_buf(field_name.data, field_name.size); + if (!tryReadText(x, tmp_buf) || !tmp_buf.eof() || !value_to_name_map.contains(x)) + return false; + return true; + } + return false; + } + x = it->getMapped(); + return true; +} + template <typename T> Names EnumValues<T>::getAllRegisteredNames() const { diff --git a/src/DataTypes/EnumValues.h b/src/DataTypes/EnumValues.h index 5189f7a56f5..889878bc60f 100644 --- a/src/DataTypes/EnumValues.h +++ b/src/DataTypes/EnumValues.h @@ -7,7 +7,7 @@ namespace DB { namespace ErrorCodes { extern const int BAD_ARGUMENTS; } @@ -42,6 +42,11 @@ public: return it; } + bool hasValue(const T & value) const + { + return value_to_name_map.contains(value); + } + /// throws exception if value is not valid const StringRef & getNameForValue(const T & value) const { @@ -60,6 +65,7 @@ public: } T getValue(StringRef field_name, bool try_treat_as_id = false) const; + bool tryGetValue(T & x, StringRef field_name, bool try_treat_as_id = false) const; template <typename TValues> bool containsAll(const TValues & rhs_values) const diff --git a/src/DataTypes/IDataType.cpp b/src/DataTypes/IDataType.cpp index 2a7e0f246de..392c56343e3 100644 --- a/src/DataTypes/IDataType.cpp +++ b/src/DataTypes/IDataType.cpp @@ -109,11 +109,26 @@ Ptr IDataType::getForSubcolumn( bool throw_if_null) const { Ptr res; - forEachSubcolumn([&](const auto &, const auto & name, const auto & subdata) + + ISerialization::StreamCallback callback_with_data = [&](const auto & subpath) { - if (name == subcolumn_name) - res = subdata.*member; - }, data); + for (size_t i = 0; i < subpath.size(); ++i) + { + size_t prefix_len = i + 1; + if (!subpath[i].visited && ISerialization::hasSubcolumnForPath(subpath, prefix_len)) + { + auto name = ISerialization::getSubcolumnNameForStream(subpath, prefix_len); + /// Create data from path only if it's requested subcolumn.
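+ /// (other paths are only marked as visited below, no SubstreamData is built for them).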
+ if (name == subcolumn_name) + res = ISerialization::createFromPath(subpath, prefix_len).*member; + } + subpath[i].visited = true; + } + }; + + ISerialization::EnumerateStreamsSettings settings; + settings.position_independent_encoding = false; + data.serialization->enumerateStreams(settings, callback_with_data, data); if (!res && throw_if_null) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "There is no subcolumn {} in type {}", subcolumn_name, getName()); diff --git a/src/DataTypes/IDataType.h b/src/DataTypes/IDataType.h index eabf066bc3d..ccdf54f57c3 100644 --- a/src/DataTypes/IDataType.h +++ b/src/DataTypes/IDataType.h @@ -412,6 +412,8 @@ struct WhichDataType constexpr bool isSimple() const { return isInt() || isUInt() || isFloat() || isString(); } constexpr bool isLowCardinality() const { return idx == TypeIndex::LowCardinality; } + + constexpr bool isVariant() const { return idx == TypeIndex::Variant; } }; /// IDataType helpers (alternative for IDataType virtual methods with single point of truth) @@ -464,6 +466,7 @@ template inline bool isTuple(const T & data_type) { return WhichDat template inline bool isMap(const T & data_type) {return WhichDataType(data_type).isMap(); } template inline bool isInterval(const T & data_type) {return WhichDataType(data_type).isInterval(); } template inline bool isObject(const T & data_type) { return WhichDataType(data_type).isObject(); } +template inline bool isVariant(const T & data_type) { return WhichDataType(data_type).isVariant(); } template inline bool isNothing(const T & data_type) { return WhichDataType(data_type).isNothing(); } diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index e70dc6a2380..86a37949dc8 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -55,6 +55,9 @@ String ISerialization::Substream::toString() const return fmt::format("TupleElement({}, escape_tuple_delimiter = {})", tuple_element_name, escape_tuple_delimiter ? "true" : "false"); + if (type == VariantElement) + return fmt::format("VariantElement({})", variant_element_name); + return String(magic_enum::enum_name(type)); } @@ -172,6 +175,10 @@ String getNameForSubstreamPath( else stream_name += "." + it->tuple_element_name; } + else if (it->type == Substream::VariantDiscriminators) + stream_name += ".discr"; + else if (it->type == Substream::VariantElement) + stream_name += "." + it->variant_element_name; } return stream_name; @@ -252,6 +259,45 @@ bool ISerialization::isSpecialCompressionAllowed(const SubstreamPath & path) return true; } +#define TRY_DESERIALIZE_TEXT(deserialize) \ + size_t prev_size = column.size(); \ + try \ + { \ + deserialize(column, istr, settings); \ + return true; \ + } \ + catch (...) 
\ + { \ + if (column.size() > prev_size) \ + column.popBack(column.size() - prev_size); \ + return false; \ + } \ + +bool ISerialization::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextCSV) +} + +bool ISerialization::tryDeserializeTextEscaped(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextEscaped) +} + +bool ISerialization::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextJSON) +} + +bool ISerialization::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextQuoted) +} + +bool ISerialization::tryDeserializeWholeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeWholeText) +} + void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { String field; @@ -261,6 +307,15 @@ void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, con deserializeWholeText(column, buf, settings); } +bool ISerialization::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + /// Read until \t or \n. + readString(field, istr); + ReadBufferFromString buf(field); + return tryDeserializeWholeText(column, buf, settings); +} + void ISerialization::serializeTextMarkdown( const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const { @@ -288,7 +343,9 @@ bool ISerialization::hasSubcolumnForPath(const SubstreamPath & path, size_t pref size_t last_elem = prefix_len - 1; return path[last_elem].type == Substream::NullMap || path[last_elem].type == Substream::TupleElement - || path[last_elem].type == Substream::ArraySizes; + || path[last_elem].type == Substream::ArraySizes + || path[last_elem].type == Substream::VariantDiscriminators + || path[last_elem].type == Substream::VariantElement; } ISerialization::SubstreamData ISerialization::createFromPath(const SubstreamPath & path, size_t prefix_len) @@ -317,6 +374,8 @@ void ISerialization::throwUnexpectedDataAfterParsedValue(IColumn & column, ReadB { WriteBufferFromOwnString ostr; serializeText(column, column.size() - 1, ostr, settings); + /// Restore correct column size. + column.popBack(1); throw Exception( ErrorCodes::UNEXPECTED_DATA_AFTER_PARSED_VALUE, "Unexpected data '{}' after parsed {} value '{}'", diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index 030c3c6d81e..f0273f59d1f 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -152,6 +152,10 @@ public: ObjectStructure, ObjectData, + VariantDiscriminators, + VariantElements, + VariantElement, + Regular, }; @@ -160,6 +164,9 @@ public: /// Index of tuple element, starting at 1 or name. String tuple_element_name; + /// The name of a variant element type. + String variant_element_name; + /// Do we need to escape a dot in filenames for tuple elements. 
bool escape_tuple_delimiter = true; @@ -320,17 +327,20 @@ public: virtual void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization as a literal that may be inserted into a query. */ virtual void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization for the CSV format. */ virtual void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization for displaying on a terminal or saving into a text file, and the like. * Without escaping or quoting. @@ -340,11 +350,13 @@ public: /** Text deserialization in case when buffer contains only one value, without any escaping and delimiters. */ virtual void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization intended for using in JSON format. */ virtual void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; virtual void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t /*indent*/) const { serializeTextJSON(column, row_num, ostr, settings); @@ -364,6 +376,7 @@ public: * additional code in data types serialization and ReadHelpers. 
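+ * The tryDeserializeTextRaw counterpart added below returns false instead of throwing and leaves the column unchanged on failure.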
*/ virtual void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; + virtual bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; virtual void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const; virtual void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const; diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index c804f58c567..be23278ef25 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -417,9 +417,11 @@ static void serializeTextImpl(const IColumn & column, size_t row_num, WriteBuffe } -template <typename Reader> -static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && read_nested, bool allow_unenclosed) +template <typename ReturnType = void, typename Reader> +static ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && read_nested, bool allow_unenclosed) { + static constexpr bool throw_exception = std::is_same_v<ReturnType, void>; + ColumnArray & column_array = assert_cast<ColumnArray &>(column); ColumnArray::Offsets & offsets = column_array.getOffsets(); @@ -431,7 +433,18 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (checkChar('[', istr)) has_braces = true; else if (!allow_unenclosed) - throw Exception(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, "Array does not start with '[' character"); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, "Array does not start with '[' character"); + return ReturnType(false); + } + + auto on_error_no_throw = [&]() + { + if (size) + nested_column.popBack(size); + return ReturnType(false); + }; try { @@ -441,11 +454,17 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (!first) { if (*istr.position() == ',') + { ++istr.position(); + } else - throw ParsingException(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, - "Cannot read array from text, expected comma or end of array, found '{}'", - *istr.position()); + { + if constexpr (throw_exception) + throw ParsingException(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, + "Cannot read array from text, expected comma or end of array, found '{}'", + *istr.position()); + return on_error_no_throw(); + } } first = false; @@ -455,25 +474,42 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (*istr.position() == ']') break; - read_nested(nested_column); + if constexpr (throw_exception) + read_nested(nested_column); + else if (!read_nested(nested_column)) + return on_error_no_throw(); + ++size; skipWhitespaceIfAny(istr); } if (has_braces) - assertChar(']', istr); + { + if constexpr (throw_exception) + assertChar(']', istr); + else if (!checkChar(']', istr)) + return on_error_no_throw(); + } else /// If array is not enclosed in braces, we read until EOF. - assertEOF(istr); + { + if constexpr (throw_exception) + assertEOF(istr); + else if (!istr.eof()) + return on_error_no_throw(); + } } catch (...)
{ if (size) nested_column.popBack(size); - throw; + if constexpr (throw_exception) + throw; + return ReturnType(false); } offsets.push_back(offsets.back() + size); + return ReturnType(true); } @@ -492,8 +528,8 @@ void SerializationArray::deserializeText(IColumn & column, ReadBuffer & istr, co deserializeTextImpl(column, istr, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(nested_column, istr, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(nested_column, istr, settings, nested); else nested->deserializeTextQuoted(nested_column, istr, settings); }, false); @@ -502,6 +538,29 @@ void SerializationArray::deserializeText(IColumn & column, ReadBuffer & istr, co throwUnexpectedDataAfterParsedValue(column, istr, settings, "Array"); } +bool SerializationArray::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const +{ + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(nested_column, istr, settings, nested); + return nested->tryDeserializeTextQuoted(nested_column, istr, settings); + }; + + bool ok = deserializeTextImpl<bool>(column, istr, std::move(read_nested), false); + + if (!ok) + return false; + + if (whole && !istr.eof()) + { + column.popBack(1); + return false; + } + + return true; +} + void SerializationArray::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { const ColumnArray & column_array = assert_cast<const ColumnArray &>(column); @@ -557,13 +616,25 @@ void SerializationArray::deserializeTextJSON(IColumn & column, ReadBuffer & istr deserializeTextImpl(column, istr, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextJSONImpl(nested_column, istr, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(nested_column, istr, settings, nested); else nested->deserializeTextJSON(nested_column, istr, settings); }, false); } +bool SerializationArray::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(nested_column, istr, settings, nested); + return nested->tryDeserializeTextJSON(nested_column, istr, settings); + }; + + return deserializeTextImpl<bool>(column, istr, std::move(read_nested), false); +} + void SerializationArray::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -606,8 +677,8 @@ void SerializationArray::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeTextImpl(column, rb, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextCSVImpl(nested_column, rb, settings, nested);
else nested->deserializeTextCSV(nested_column, rb, settings); }, true); @@ -617,12 +688,43 @@ void SerializationArray::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeTextImpl(column, rb, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(nested_column, rb, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(nested_column, rb, settings, nested); else nested->deserializeTextQuoted(nested_column, rb, settings); }, true); } } +bool SerializationArray::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String s; + if (!tryReadCSV(s, istr, settings.csv)) + return false; + ReadBufferFromString rb(s); + + if (settings.csv.arrays_as_nested_csv) + { + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(nested_column, rb, settings, nested); + return nested->tryDeserializeTextCSV(nested_column, rb, settings); + }; + + return deserializeTextImpl<bool>(column, rb, read_nested, true); + } + else + { + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(nested_column, rb, settings, nested); + return nested->tryDeserializeTextQuoted(nested_column, rb, settings); + }; + + return deserializeTextImpl<bool>(column, rb, read_nested, true); + } +} + } diff --git a/src/DataTypes/Serializations/SerializationArray.h b/src/DataTypes/Serializations/SerializationArray.h index de331169db5..82f5e8bce45 100644 --- a/src/DataTypes/Serializations/SerializationArray.h +++ b/src/DataTypes/Serializations/SerializationArray.h @@ -20,15 +20,18 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Streaming serialization of arrays is arranged in a special way: * - elements placed in a row are written/read without array sizes; diff --git a/src/DataTypes/Serializations/SerializationBool.cpp
b/src/DataTypes/Serializations/SerializationBool.cpp index 41b5bf806e5..f745fac4d30 100644 --- a/src/DataTypes/Serializations/SerializationBool.cpp +++ b/src/DataTypes/Serializations/SerializationBool.cpp @@ -150,30 +150,42 @@ bool tryDeserializeAllVariants(ColumnUInt8 * column, ReadBuffer & istr) return true; } -void deserializeImpl( +template <typename ReturnType = void> +ReturnType deserializeImpl( IColumn & column, ReadBuffer & istr, const FormatSettings & settings, std::function<bool(ReadBuffer &)> check_end_of_value) { + static constexpr bool throw_exception = std::is_same_v<ReturnType, void>; + ColumnUInt8 * col = checkAndGetDeserializeColumnType(column); + auto restore_column_if_needed = [&, prev_size = col->size()]() + { + if (col->size() > prev_size) + col->popBack(1); + }; PeekableReadBuffer buf(istr); buf.setCheckpoint(); if (checkString(settings.bool_true_representation, buf) && check_end_of_value(buf)) { col->insert(true); - return; + return ReturnType(true); } buf.rollbackToCheckpoint(); if (checkString(settings.bool_false_representation, buf) && check_end_of_value(buf)) { - col->insert(false); buf.dropCheckpoint(); if (buf.hasUnreadData()) - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " - "bool_true_representation or bool_false_representation contains some delimiters of input format"); - return; + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " + "bool_true_representation or bool_false_representation contains some delimiters of input format"); + return ReturnType(false); + } + col->insert(false); + return ReturnType(true); } buf.rollbackToCheckpoint(); @@ -181,22 +193,31 @@ void deserializeImpl( { buf.dropCheckpoint(); if (buf.hasUnreadData()) - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " - "bool_true_representation or bool_false_representation contains some delimiters of input format"); - return; + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot continue parsing after parsed bool value because it will result in the loss of some data.
It may happen if " + "bool_true_representation or bool_false_representation contains some delimiters of input format"); + restore_column_if_needed(); + return ReturnType(false); + } + return ReturnType(true); } buf.makeContinuousMemoryFromCheckpointToPos(); buf.rollbackToCheckpoint(); - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot parse boolean value here: '{}', should be '{}' or '{}' controlled by setting bool_true_representation and " - "bool_false_representation or one of " - "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0", - String(buf.position(), std::min(10lu, buf.available())), - settings.bool_true_representation, settings.bool_false_representation); + restore_column_if_needed(); + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot parse boolean value here: '{}', should be '{}' or '{}' controlled by setting bool_true_representation and " + "bool_false_representation or one of " + "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0", + String(buf.position(), std::min(10lu, buf.available())), + settings.bool_true_representation, settings.bool_false_representation); + + return ReturnType(false); } } @@ -225,6 +246,14 @@ void SerializationBool::deserializeTextEscaped(IColumn & column, ReadBuffer & is deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); } +bool SerializationBool::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl<bool>(column, istr, settings, [](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); +} + void SerializationBool::serializeTextJSON(const IColumn &column, size_t row_num, WriteBuffer &ostr, const FormatSettings &settings) const { serializeSimple(column, row_num, ostr, settings); @@ -250,6 +279,33 @@ void SerializationBool::deserializeTextJSON(IColumn &column, ReadBuffer &istr, c col->insert(value); } +bool SerializationBool::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + if (istr.eof()) + return false; + + ColumnUInt8 * col = checkAndGetDeserializeColumnType(column); + bool value = false; + char first_char = *istr.position(); + if (first_char == 't' || first_char == 'f') + { + if (!readBoolTextWord<bool>(value, istr)) + return false; + } + else if (first_char == '1' || first_char == '0') + { + /// Doesn't throw.
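+ /// ('0' or '1' was checked above, so reading a single digit here always succeeds).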
+ readBoolText(value, istr); + } + else + { + return false; + } + + col->insert(value); + return true; +} + void SerializationBool::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeCustom(column, row_num, ostr, settings); @@ -263,6 +319,14 @@ void SerializationBool::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == settings.csv.delimiter || *buf.position() == '\n' || *buf.position() == '\r'; }); } +bool SerializationBool::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl<bool>(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == settings.csv.delimiter || *buf.position() == '\n' || *buf.position() == '\r'; }); +} + void SerializationBool::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeCustom(column, row_num, ostr, settings); @@ -276,15 +340,30 @@ void SerializationBool::deserializeTextRaw(IColumn & column, ReadBuffer & istr, deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); } +bool SerializationBool::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl<bool>(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); +} + void SerializationBool::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeSimple(column, row_num, ostr, settings); } -void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +template <typename ReturnType = void> +ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) { + static constexpr bool throw_exception = std::is_same_v<ReturnType, void>; + if (istr.eof()) - throw Exception(ErrorCodes::CANNOT_PARSE_BOOL, "Expected boolean value but get EOF."); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::CANNOT_PARSE_BOOL, "Expected boolean value but got EOF."); + return ReturnType(false); + } auto * col = checkAndGetDeserializeColumnType(column); @@ -292,11 +371,17 @@ void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & ist switch (symbol) { case 't': - assertStringCaseInsensitive("true", istr); + if constexpr (throw_exception) + assertStringCaseInsensitive("true", istr); + else if (!checkStringCaseInsensitive("true", istr)) + return ReturnType(false); col->insert(true); break; case 'f': - assertStringCaseInsensitive("false", istr); + if constexpr (throw_exception) + assertStringCaseInsensitive("false", istr); + else if (!checkStringCaseInsensitive("false", istr)) + return ReturnType(false); col->insert(false); break; case '1': @@ -307,16 +392,40 @@ void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & ist break; case '\'': ++istr.position(); - deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return !buf.eof() && *buf.position() ==
'\''; }); - assertChar('\'', istr); + if constexpr (throw_exception) + { + deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return !buf.eof() && *buf.position() == '\''; }); + assertChar('\'', istr); + } + else + { + if (!deserializeImpl<bool>(column, istr, settings, [](ReadBuffer & buf) { return !buf.eof() && *buf.position() == '\''; }) || !checkChar('\'', istr)) + return ReturnType(false); + } break; default: - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot parse boolean value here: '{}', should be true/false, 1/0 or on of " - "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0 in quotes", - String(istr.position(), std::min(10ul, istr.available()))); + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot parse boolean value here: '{}', should be true/false, 1/0 or one of " + "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0 in quotes", + String(istr.position(), std::min(10ul, istr.available()))); + return ReturnType(false); + } } + + return ReturnType(true); +} + +void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + deserializeTextQuotedImpl(column, istr, settings); +} + +bool SerializationBool::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return deserializeTextQuotedImpl<bool>(column, istr, settings); } void SerializationBool::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -327,6 +436,14 @@ deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof(); }); } +bool SerializationBool::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl<bool>(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof(); }); +} + void SerializationBool::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeSimple(column, row_num, ostr, settings); diff --git a/src/DataTypes/Serializations/SerializationBool.h b/src/DataTypes/Serializations/SerializationBool.h index a5aa0ca80a2..3e511b7249e 100644 --- a/src/DataTypes/Serializations/SerializationBool.h +++ b/src/DataTypes/Serializations/SerializationBool.h @@ -15,21 +15,27 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; - void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn &
column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; }; diff --git a/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp b/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp index 03564bac64b..abe443cab1b 100644 --- a/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp +++ b/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp @@ -24,6 +24,12 @@ void deserializeFromString(const SerializationCustomSimpleText & domain, IColumn domain.deserializeText(column, istr, settings, true); } +bool tryDeserializeFromString(const SerializationCustomSimpleText & domain, IColumn & column, const String & s, const FormatSettings & settings) +{ + ReadBufferFromString istr(s); + return domain.tryDeserializeText(column, istr, settings, true); +} + } namespace DB @@ -34,6 +40,19 @@ SerializationCustomSimpleText::SerializationCustomSimpleText(const Serialization { } +bool SerializationCustomSimpleText::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + try + { + deserializeText(column, istr, settings, whole); + return true; + } + catch (...) 
+ { + return false; + } +} + void SerializationCustomSimpleText::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { String str; @@ -41,6 +60,13 @@ void SerializationCustomSimpleText::deserializeWholeText(IColumn & column, ReadB deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readStringUntilEOF(str, istr); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeEscapedString(serializeToString(*this, column, row_num, settings), ostr); @@ -53,6 +79,13 @@ void SerializationCustomSimpleText::deserializeTextEscaped(IColumn & column, Rea deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readEscapedString(str, istr); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeQuotedString(serializeToString(*this, column, row_num, settings), ostr); @@ -65,6 +98,14 @@ void SerializationCustomSimpleText::deserializeTextQuoted(IColumn & column, Read deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + if (!tryReadQuotedString(str, istr)) + return false; + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeCSVString(serializeToString(*this, column, row_num, settings), ostr); @@ -77,6 +118,13 @@ void SerializationCustomSimpleText::deserializeTextCSV(IColumn & column, ReadBuf deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readCSVStringInto(str, istr, settings.csv); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeJSONString(serializeToString(*this, column, row_num, settings), ostr, settings); @@ -89,6 +137,14 @@ void SerializationCustomSimpleText::deserializeTextJSON(IColumn & column, ReadBu deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + if (!tryReadJSONStringInto(str, istr)) + return false; + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeXMLStringForTextElement(serializeToString(*this, column, row_num, settings), ostr); diff --git a/src/DataTypes/Serializations/SerializationCustomSimpleText.h 
b/src/DataTypes/Serializations/SerializationCustomSimpleText.h index 0c909350002..c80a57e234c 100644 --- a/src/DataTypes/Serializations/SerializationCustomSimpleText.h +++ b/src/DataTypes/Serializations/SerializationCustomSimpleText.h @@ -22,20 +22,24 @@ public: /// whole = true means that buffer contains only one value, so we should read until EOF. /// It's needed to check if there is garbage after parsed field. virtual void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const = 0; + virtual bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const; /** Text deserialization in case when buffer contains only one value, without any escaping and delimiters. */ void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization with escaping but without quoting. */ void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization as a literal that may be inserted into a query. */ void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization for the CSV format. */ @@ -44,12 +48,14 @@ public: * (the delimiter is not consumed). */ void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization intended for using in JSON format. * force_quoting_64bit_integers parameter forces to brace UInt64 and Int64 types into quotes. */ void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization for putting into the XML format. 
*/ diff --git a/src/DataTypes/Serializations/SerializationDate.cpp b/src/DataTypes/Serializations/SerializationDate.cpp index 534f599a072..38e1bb87b6d 100644 --- a/src/DataTypes/Serializations/SerializationDate.cpp +++ b/src/DataTypes/Serializations/SerializationDate.cpp @@ -22,6 +22,15 @@ void SerializationDate::deserializeWholeText(IColumn & column, ReadBuffer & istr throwUnexpectedDataAfterParsedValue(column, istr, settings, "Date"); } +bool SerializationDate::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!tryReadDateText(x, istr, time_zone) || !istr.eof()) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { DayNum x; @@ -29,6 +38,15 @@ void SerializationDate::deserializeTextEscaped(IColumn & column, ReadBuffer & is assert_cast(column).getData().push_back(x); } +bool SerializationDate::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!tryReadDateText(x, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeText(column, row_num, ostr, settings); @@ -50,6 +68,16 @@ void SerializationDate::deserializeTextQuoted(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. } +bool SerializationDate::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!checkChar('\'', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('\'', istr)) + return false; + + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -66,6 +94,15 @@ void SerializationDate::deserializeTextJSON(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(x); } +bool SerializationDate::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!checkChar('"', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -80,6 +117,15 @@ void SerializationDate::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(value); } +bool SerializationDate::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum value; + if (!tryReadCSV(value, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(value); + return true; +} + SerializationDate::SerializationDate(const DateLUTImpl & time_zone_) : time_zone(time_zone_) { } diff --git a/src/DataTypes/Serializations/SerializationDate.h b/src/DataTypes/Serializations/SerializationDate.h index f751b06fba6..dcf79eb49da 100644 --- a/src/DataTypes/Serializations/SerializationDate.h +++ b/src/DataTypes/Serializations/SerializationDate.h @@ -13,14 +13,19 @@ public: void 
serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; protected: const DateLUTImpl & time_zone; diff --git a/src/DataTypes/Serializations/SerializationDate32.cpp b/src/DataTypes/Serializations/SerializationDate32.cpp index 851710de839..70a22d59e42 100644 --- a/src/DataTypes/Serializations/SerializationDate32.cpp +++ b/src/DataTypes/Serializations/SerializationDate32.cpp @@ -21,6 +21,15 @@ void SerializationDate32::deserializeWholeText(IColumn & column, ReadBuffer & is throwUnexpectedDataAfterParsedValue(column, istr, settings, "Date32"); } +bool SerializationDate32::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!tryReadDateText(x, istr, time_zone) || !istr.eof()) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { ExtendedDayNum x; @@ -28,6 +37,15 @@ void SerializationDate32::deserializeTextEscaped(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +bool SerializationDate32::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!tryReadDateText(x, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeText(column, row_num, ostr, settings); @@ -49,6 +67,15 @@ void SerializationDate32::deserializeTextQuoted(IColumn & column, ReadBuffer & i assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. 
} +bool SerializationDate32::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!checkChar('\'', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('\'', istr)) + return false; + assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. + return true; +} + void SerializationDate32::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -65,6 +92,15 @@ void SerializationDate32::deserializeTextJSON(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(x); } +bool SerializationDate32::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!checkChar('"', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -79,6 +115,15 @@ void SerializationDate32::deserializeTextCSV(IColumn & column, ReadBuffer & istr assert_cast(column).getData().push_back(value.getExtenedDayNum()); } +bool SerializationDate32::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + LocalDate value; + if (!tryReadCSV(value, istr)) + return false; + assert_cast(column).getData().push_back(value.getExtenedDayNum()); + return true; +} + SerializationDate32::SerializationDate32(const DateLUTImpl & time_zone_) : time_zone(time_zone_) { } diff --git a/src/DataTypes/Serializations/SerializationDate32.h b/src/DataTypes/Serializations/SerializationDate32.h index 49560fb6c7d..be2e2b76c1d 100644 --- a/src/DataTypes/Serializations/SerializationDate32.h +++ b/src/DataTypes/Serializations/SerializationDate32.h @@ -12,14 +12,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const 
FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; protected: const DateLUTImpl & time_zone; diff --git a/src/DataTypes/Serializations/SerializationDateTime.cpp b/src/DataTypes/Serializations/SerializationDateTime.cpp index 77beb0d9b75..17465d85e9d 100644 --- a/src/DataTypes/Serializations/SerializationDateTime.cpp +++ b/src/DataTypes/Serializations/SerializationDateTime.cpp @@ -21,15 +21,56 @@ inline void readText(time_t & x, ReadBuffer & istr, const FormatSettings & setti switch (settings.date_time_input_format) { case FormatSettings::DateTimeInputFormat::Basic: - readDateTimeText(x, istr, time_zone); - return; + readDateTimeTextImpl<>(x, istr, time_zone); + break; case FormatSettings::DateTimeInputFormat::BestEffort: parseDateTimeBestEffort(x, istr, time_zone, utc_time_zone); - return; + break; case FormatSettings::DateTimeInputFormat::BestEffortUS: parseDateTimeBestEffortUS(x, istr, time_zone, utc_time_zone); - return; + break; } + + if (x < 0) + x = 0; +} + +inline void readAsIntText(time_t & x, ReadBuffer & istr) +{ + readIntText(x, istr); + if (x < 0) + x = 0; +} + +inline bool tryReadText(time_t & x, ReadBuffer & istr, const FormatSettings & settings, const DateLUTImpl & time_zone, const DateLUTImpl & utc_time_zone) +{ + bool res; + switch (settings.date_time_input_format) + { + case FormatSettings::DateTimeInputFormat::Basic: + res = tryReadDateTimeText(x, istr, time_zone); + break; + case FormatSettings::DateTimeInputFormat::BestEffort: + res = tryParseDateTimeBestEffort(x, istr, time_zone, utc_time_zone); + break; + case FormatSettings::DateTimeInputFormat::BestEffortUS: + res = tryParseDateTimeBestEffortUS(x, istr, time_zone, utc_time_zone); + break; + } + + if (x < 0) + x = 0; + + return res; +} + +inline bool tryReadAsIntText(time_t & x, ReadBuffer & istr) +{ + if (!tryReadIntText(x, istr)) + return false; + if (x < 0) + x = 0; + return true; } } @@ -68,15 +109,32 @@ void SerializationDateTime::deserializeWholeText(IColumn & column, ReadBuffer & throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime"); } +bool SerializationDateTime::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !istr.eof()) + return false; + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { time_t x = 0; readText(x, istr, settings, time_zone, utc_time_zone); - if (x < 0) - x = 0; assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone)) + return false; + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('\'', ostr); @@ -94,15 +152,32 @@ void SerializationDateTime::deserializeTextQuoted(IColumn & column, ReadBuffer & } else /// Just 1504193808 or 01504193808 { - readIntText(x, istr); + readAsIntText(x, istr); } - if (x < 0) - x = 0; /// It's important to do this at the end - for exception safety. 
assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808' + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) + return false; + } + else /// Just 1504193808 or 01504193808 + { + if (!tryReadAsIntText(x, istr)) + return false; + } + + /// It's important to do this at the end - for exception safety. + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -120,13 +195,30 @@ void SerializationDateTime::deserializeTextJSON(IColumn & column, ReadBuffer & i } else { - readIntText(x, istr); + readAsIntText(x, istr); } - if (x < 0) - x = 0; + assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (checkChar('"', istr)) + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar('"', istr)) + return false; + } + else + { + if (!tryReadIntText(x, istr)) + return false; + } + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -165,13 +257,48 @@ void SerializationDateTime::deserializeTextCSV(IColumn & column, ReadBuffer & is readCSVString(datetime_str, istr, settings.csv); ReadBufferFromString buf(datetime_str); readText(x, buf, settings, time_zone, utc_time_zone); + if (!buf.eof()) + throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime"); } } - if (x < 0) - x = 0; - assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + + if (istr.eof()) + return false; + + char maybe_quote = *istr.position(); + + if (maybe_quote == '\'' || maybe_quote == '\"') + { + ++istr.position(); + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar(maybe_quote, istr)) + return false; + } + else + { + if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic) + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone)) + return false; + } + else + { + String datetime_str; + readCSVString(datetime_str, istr, settings.csv); + ReadBufferFromString buf(datetime_str); + if (!tryReadText(x, buf, settings, time_zone, utc_time_zone) || !buf.eof()) + return false; + } + } + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + } diff --git a/src/DataTypes/Serializations/SerializationDateTime.h b/src/DataTypes/Serializations/SerializationDateTime.h index f4a142483e5..584b0c4116b 100644 --- a/src/DataTypes/Serializations/SerializationDateTime.h +++ b/src/DataTypes/Serializations/SerializationDateTime.h @@ -15,14 +15,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & 
settings) const override;
+    bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
 
     void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
 
     void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
 
     void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
 
     void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
 };
 
 }
diff --git a/src/DataTypes/Serializations/SerializationDateTime64.cpp b/src/DataTypes/Serializations/SerializationDateTime64.cpp
index 93891886000..a19619bf8d3 100644
--- a/src/DataTypes/Serializations/SerializationDateTime64.cpp
+++ b/src/DataTypes/Serializations/SerializationDateTime64.cpp
@@ -47,6 +47,16 @@ void SerializationDateTime64::deserializeText(IColumn & column, ReadBuffer & ist
     throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime64");
 }
 
+bool SerializationDateTime64::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const
+{
+    DateTime64 result = 0;
+    if (!tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && !istr.eof()))
+        return false;
+
+    assert_cast<ColumnType &>(column).getData().push_back(result);
+    return true;
+}
+
 void SerializationDateTime64::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
 {
     deserializeTextEscaped(column, istr, settings);
@@ -75,6 +85,29 @@ static inline void readText(DateTime64 & x, UInt32 scale, ReadBuffer & istr, con
     }
 }
 
+static inline bool tryReadText(DateTime64 & x, UInt32 scale, ReadBuffer & istr, const FormatSettings & settings, const DateLUTImpl & time_zone, const DateLUTImpl & utc_time_zone)
+{
+    switch (settings.date_time_input_format)
+    {
+        case FormatSettings::DateTimeInputFormat::Basic:
+            return tryReadDateTime64Text(x, scale, istr, time_zone);
+        case FormatSettings::DateTimeInputFormat::BestEffort:
+            return tryParseDateTime64BestEffort(x, scale, istr, time_zone, utc_time_zone);
+        case FormatSettings::DateTimeInputFormat::BestEffortUS:
+            return tryParseDateTime64BestEffortUS(x, scale, istr, time_zone, utc_time_zone);
+    }
+}
+
+
+bool SerializationDateTime64::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    DateTime64 x = 0;
+    if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !istr.eof())
+        return false;
+    assert_cast<ColumnType &>(column).getData().push_back(x);
+    return true;
+}
+
 void SerializationDateTime64::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
 {
     DateTime64 x = 0;
@@ -82,6 +115,15 @@ void SerializationDateTime64::deserializeTextEscaped(IColumn & column, ReadBuffe
     assert_cast<ColumnType &>(column).getData().push_back(x);
 }
 
+bool SerializationDateTime64::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    DateTime64 x = 0;
+    if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone))
+        return false;
+    assert_cast<ColumnType &>(column).getData().push_back(x);
+    return true;
+}
+
 void SerializationDateTime64::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     writeChar('\'', ostr);
@@ -104,6 +146,23 @@ void SerializationDateTime64::deserializeTextQuoted(IColumn & column, ReadBuffer
     assert_cast<ColumnType &>(column).getData().push_back(x);    /// It's important to do this at the end - for exception safety.
 }
 
+bool SerializationDateTime64::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    DateTime64 x = 0;
+    if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808'
+    {
+        if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr))
+            return false;
+    }
+    else /// Just 1504193808 or 01504193808
+    {
+        if (!tryReadIntText(x, istr))
+            return false;
+    }
+    assert_cast<ColumnType &>(column).getData().push_back(x);    /// It's important to do this at the end - for exception safety.
+    return true;
+}
+
 void SerializationDateTime64::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     writeChar('"', ostr);
@@ -126,6 +185,23 @@ void SerializationDateTime64::deserializeTextJSON(IColumn & column, ReadBuffer &
     assert_cast<ColumnType &>(column).getData().push_back(x);
 }
 
+bool SerializationDateTime64::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    DateTime64 x = 0;
+    if (checkChar('"', istr))
+    {
+        if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('"', istr))
+            return false;
+    }
+    else
+    {
+        if (!tryReadIntText(x, istr))
+            return false;
+    }
+    assert_cast<ColumnType &>(column).getData().push_back(x);
+    return true;
+}
+
 void SerializationDateTime64::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     writeChar('"', ostr);
@@ -170,4 +246,40 @@ void SerializationDateTime64::deserializeTextCSV(IColumn & column, ReadBuffer &
     assert_cast<ColumnType &>(column).getData().push_back(x);
 }
 
+bool SerializationDateTime64::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    DateTime64 x = 0;
+
+    if (istr.eof())
+        return false;
+
+    char maybe_quote = *istr.position();
+
+    if (maybe_quote == '\'' || maybe_quote == '\"')
+    {
+        ++istr.position();
+        if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar(maybe_quote, istr))
+            return false;
+    }
+    else
+    {
+        if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic)
+        {
+            if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone))
+                return false;
+        }
+        else
+        {
+            String datetime_str;
+            readCSVString(datetime_str, istr, settings.csv);
+            ReadBufferFromString buf(datetime_str);
+            if (!tryReadText(x, scale, buf, settings, time_zone, utc_time_zone) || !buf.eof())
+                return false;
+        }
+    }
+
+
assert_cast(column).getData().push_back(x); + return true; +} + } diff --git a/src/DataTypes/Serializations/SerializationDateTime64.h b/src/DataTypes/Serializations/SerializationDateTime64.h index f817edbf0dd..b49bd1e9098 100644 --- a/src/DataTypes/Serializations/SerializationDateTime64.h +++ b/src/DataTypes/Serializations/SerializationDateTime64.h @@ -15,15 +15,21 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; }; } diff --git a/src/DataTypes/Serializations/SerializationDecimal.cpp b/src/DataTypes/Serializations/SerializationDecimal.cpp index b576b7a048c..d632c224783 100644 --- a/src/DataTypes/Serializations/SerializationDecimal.cpp +++ b/src/DataTypes/Serializations/SerializationDecimal.cpp @@ -16,11 +16,19 @@ namespace ErrorCodes } template -bool SerializationDecimal::tryReadText(T & x, ReadBuffer & istr, UInt32 precision, UInt32 scale) +bool SerializationDecimal::tryReadText(T & x, ReadBuffer & istr, UInt32 precision, UInt32 scale, bool csv) { UInt32 unread_scale = scale; - if (!tryReadDecimalText(istr, x, precision, unread_scale)) - return false; + if (csv) + { + if (!tryReadCSVDecimalText(istr, x, precision, unread_scale)) + return false; + } + else + { + if (!tryReadDecimalText(istr, x, precision, unread_scale)) + return false; + } if (common::mulOverflow(x.value, DecimalUtils::scaleMultiplier(unread_scale), x.value)) return false; @@ -59,6 +67,16 @@ void SerializationDecimal::deserializeText(IColumn & column, ReadBuffer & ist ISerialization::throwUnexpectedDataAfterParsedValue(column, istr, settings, "Decimal"); } +template +bool SerializationDecimal::tryDeserializeText(IColumn & column, ReadBuffer & istr, 
const FormatSettings &, bool whole) const +{ + T x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationDecimal::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { @@ -67,6 +85,16 @@ void SerializationDecimal::deserializeTextCSV(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +template +bool SerializationDecimal::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + T x; + if (!tryReadText(x, istr, true)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationDecimal::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -88,6 +116,18 @@ void SerializationDecimal::deserializeTextJSON(IColumn & column, ReadBuffer & assertChar('"', istr); } +template +bool SerializationDecimal::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + bool have_quotes = checkChar('"', istr); + T x; + if (!tryReadText(x, istr) || (have_quotes && !checkChar('"', istr))) + return false; + + assert_cast(column).getData().push_back(x); + return true; +} + template class SerializationDecimal; template class SerializationDecimal; diff --git a/src/DataTypes/Serializations/SerializationDecimal.h b/src/DataTypes/Serializations/SerializationDecimal.h index 57decdd0973..22a8eb1a47c 100644 --- a/src/DataTypes/Serializations/SerializationDecimal.h +++ b/src/DataTypes/Serializations/SerializationDecimal.h @@ -16,15 +16,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void readText(T & x, ReadBuffer & istr, bool csv = false) const { readText(x, istr, this->precision, this->scale, csv); } + bool tryReadText(T & x, ReadBuffer & istr, bool csv = false) const { return tryReadText(x, istr, this->precision, this->scale, csv); } static void readText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_, bool csv = false); - static bool tryReadText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_); + static bool tryReadText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_, bool csv = false); }; } diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp index 9b3a437e9cf..6ad55913738 100644 --- a/src/DataTypes/Serializations/SerializationEnum.cpp +++ b/src/DataTypes/Serializations/SerializationEnum.cpp @@ -34,6 +34,27 @@ void SerializationEnum::deserializeTextEscaped(IColumn & column, ReadBuffe } } +template +bool 
SerializationEnum::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + if (settings.tsv.enum_as_number) + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readEscapedString(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -48,6 +69,18 @@ void SerializationEnum::deserializeTextQuoted(IColumn & column, ReadBuffer assert_cast(column).getData().push_back(ref_enum_values.getValue(StringRef(field_name))); } +template +bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + std::string field_name; + readQuotedStringWithSQLStyle(field_name, istr); + FieldType x; + if (!this->tryGetValue(x, StringRef(field_name))) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { @@ -65,6 +98,27 @@ void SerializationEnum::deserializeWholeText(IColumn & column, ReadBuffer } } +template +bool SerializationEnum::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + if (settings.tsv.enum_as_number) + { + if (!tryReadValue(istr, x) || !istr.eof()) + return false; + } + else + { + std::string field_name; + readStringUntilEOF(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -90,6 +144,27 @@ void SerializationEnum::deserializeTextJSON(IColumn & column, ReadBuffer & } } +template +bool SerializationEnum::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + FieldType x; + if (!istr.eof() && *istr.position() != '"') + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readJSONString(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name))) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -109,6 +184,28 @@ void SerializationEnum::deserializeTextCSV(IColumn & column, ReadBuffer & } } +template +bool SerializationEnum::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + + if (settings.csv.enum_as_number) + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readCSVString(field_name, istr, settings.csv); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextMarkdown( const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 
03b134e59a6..708161dc5fd 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -34,15 +34,20 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -53,6 +58,14 @@ public: return ref_enum_values.findByValue(x)->first; } + bool tryReadValue(ReadBuffer & istr, FieldType & x) const + { + if (!tryReadText(x, istr) || !this->hasValue(x)) + return false; + + return true; + } + std::optional> own_enum_values; std::shared_ptr> own_enum_type; const EnumValues & ref_enum_values; diff --git a/src/DataTypes/Serializations/SerializationFixedString.cpp b/src/DataTypes/Serializations/SerializationFixedString.cpp index fa50af52f2f..23e959d80c9 100644 --- a/src/DataTypes/Serializations/SerializationFixedString.cpp +++ b/src/DataTypes/Serializations/SerializationFixedString.cpp @@ -150,12 +150,49 @@ static inline void read(const SerializationFixedString & self, IColumn & column, } } +bool SerializationFixedString::tryAlignStringLength(size_t n, PaddedPODArray & data, size_t string_start) +{ + size_t length = data.size() - string_start; + if (length < n) + { + data.resize_fill(string_start + n); + } + else if (length > n) + { + data.resize_assume_reserved(string_start); + return false; + } + + return true; +} + +template +static inline bool tryRead(const SerializationFixedString & self, IColumn & column, Reader && reader) +{ + ColumnFixedString::Chars & data = typeid_cast(column).getChars(); + size_t prev_size = data.size(); + try + { + return reader(data) && SerializationFixedString::tryAlignStringLength(self.getN(), data, prev_size); + } + catch (...) 
+ { + data.resize_assume_reserved(prev_size); + return false; + } +} + void SerializationFixedString::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { read(*this, column, [&istr](ColumnFixedString::Chars & data) { readEscapedStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { readEscapedStringInto(data, istr); return true; }); +} + void SerializationFixedString::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -169,12 +206,22 @@ void SerializationFixedString::deserializeTextQuoted(IColumn & column, ReadBuffe read(*this, column, [&istr](ColumnFixedString::Chars & data) { readQuotedStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { return tryReadQuotedStringInto(data, istr); }); +} + void SerializationFixedString::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { read(*this, column, [&istr](ColumnFixedString::Chars & data) { readStringUntilEOFInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { readStringUntilEOFInto(data, istr); return true; }); +} + void SerializationFixedString::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -188,6 +235,10 @@ void SerializationFixedString::deserializeTextJSON(IColumn & column, ReadBuffer read(*this, column, [&istr](ColumnFixedString::Chars & data) { readJSONStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { return tryReadJSONStringInto(data, istr); }); +} void SerializationFixedString::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -208,6 +259,11 @@ void SerializationFixedString::deserializeTextCSV(IColumn & column, ReadBuffer & read(*this, column, [&istr, &csv = settings.csv](ColumnFixedString::Chars & data) { readCSVStringInto(data, istr, csv); }); } +bool SerializationFixedString::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryRead(*this, column, [&istr, &csv = settings.csv](ColumnFixedString::Chars & data) { readCSVStringInto(data, istr, csv); return true; }); +} + void SerializationFixedString::serializeTextMarkdown( const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const { diff --git a/src/DataTypes/Serializations/SerializationFixedString.h b/src/DataTypes/Serializations/SerializationFixedString.h index c27b10ad158..8eb4eacdbff 100644 --- a/src/DataTypes/Serializations/SerializationFixedString.h +++ b/src/DataTypes/Serializations/SerializationFixedString.h @@ -26,20 +26,25 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, 
ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -47,6 +52,7 @@ public: /// If the length is less than getN() the function will add zero characters up to getN(). /// If the length is greater than getN() the function will throw an exception. 
static void alignStringLength(size_t n, PaddedPODArray & data, size_t string_start); + static bool tryAlignStringLength(size_t n, PaddedPODArray & data, size_t string_start); }; } diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp new file mode 100644 index 00000000000..81c4af97401 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp @@ -0,0 +1,188 @@ +#include + +namespace DB +{ + +template +void SerializationIP::serializeText(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings &) const +{ + writeText(assert_cast &>(column).getData()[row_num], ostr); +} + +template +void SerializationIP::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + IPv x; + readText(x, istr); + + if (whole && !istr.eof()) + throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); + + assert_cast &>(column).getData().push_back(x); +} + +template +bool SerializationIP::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &, bool whole) const +{ + IPv x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextQuoted(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('\'', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('\'', ostr); +} + +template +void SerializationIP::deserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + assertChar('\'', istr); + readText(x, istr); + assertChar('\'', istr); + assert_cast &>(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. +} + +template +bool SerializationIP::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if (!checkChar('\'', istr) || !tryReadText(x, istr) || !checkChar('\'', istr)) + return false; + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextJSON(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('"', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('"', ostr); +} + +template +void SerializationIP::deserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + IPv x; + assertChar('"', istr); + readText(x, istr); + /// this code looks weird, but we want to throw specific exception to match original behavior... 
+ if (istr.eof()) + assertChar('"', istr); + if (*istr.position() != '"') + throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); + istr.ignore(); + + assert_cast &>(column).getData().push_back(x); +} + +template +bool SerializationIP::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if (!checkChar('"', istr) || !tryReadText(x, istr) || !checkChar('"', istr)) + return false; + + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextCSV(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('"', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('"', ostr); +} + +template +void SerializationIP::deserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv value; + readCSV(value, istr); + + assert_cast &>(column).getData().push_back(value); +} + +template +bool SerializationIP::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv value; + if (!tryReadCSV(value, istr)) + return false; + + assert_cast &>(column).getData().push_back(value); + return true; +} + +template +void SerializationIP::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const +{ + IPv x = field.get(); + if constexpr (std::is_same_v) + writeBinary(x, ostr); + else + writeBinaryLittleEndian(x, ostr); +} + +template +void SerializationIP::deserializeBinary(DB::Field & field, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if constexpr (std::is_same_v) + readBinary(x, istr); + else + readBinaryLittleEndian(x, istr); + field = NearestFieldType(x); +} + +template +void SerializationIP::serializeBinary(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings &) const +{ + writeBinary(assert_cast &>(column).getData()[row_num], ostr); +} + +template +void SerializationIP::deserializeBinary(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + readBinary(x.toUnderType(), istr); + assert_cast &>(column).getData().push_back(x); +} + +template +void SerializationIP::serializeBinaryBulk(const DB::IColumn & column, DB::WriteBuffer & ostr, size_t offset, size_t limit) const +{ + const typename ColumnVector::Container & x = typeid_cast &>(column).getData(); + + size_t size = x.size(); + + if (limit == 0 || offset + limit > size) + limit = size - offset; + + if (limit) + ostr.write(reinterpret_cast(&x[offset]), sizeof(IPv) * limit); +} + +template +void SerializationIP::deserializeBinaryBulk(DB::IColumn & column, DB::ReadBuffer & istr, size_t limit, double) const +{ + typename ColumnVector::Container & x = typeid_cast &>(column).getData(); + size_t initial_size = x.size(); + x.resize(initial_size + limit); + size_t size = istr.readBig(reinterpret_cast(&x[initial_size]), sizeof(IPv) * limit); + x.resize(initial_size + size / sizeof(IPv)); +} + +template class SerializationIP; +template class SerializationIP; + +} diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h index 7d8669fd444..a53f257646b 100644 --- a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h @@ -13,123 +13,30 @@ template class SerializationIP : public SimpleTextSerialization 
diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h
index 7d8669fd444..a53f257646b 100644
--- a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h
+++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h
@@ -13,123 +13,30 @@ template <typename IPv> class SerializationIP : public SimpleTextSerialization
 {
 public:
-    void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override
-    {
-        writeText(assert_cast<const ColumnVector<IPv> &>(column).getData()[row_num], ostr);
-    }
-    void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override
-    {
-        IPv x;
-        readText(x, istr);
+    void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
+    void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override;
+    bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override;
 
-        if (whole && !istr.eof())
-            throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName<IPv>.data());
+    void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+    void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
 
-        assert_cast<ColumnVector<IPv> &>(column).getData().push_back(x);
-    }
-    void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override
-    {
-        serializeText(column, row_num, ostr, settings);
-    }
-    void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override
-    {
-        deserializeText(column, istr, settings, false);
-    }
-    void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override
-    {
-        writeChar('\'', ostr);
-        serializeText(column, row_num, ostr, settings);
-        writeChar('\'', ostr);
-    }
-    void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override
-    {
-        IPv x;
-        assertChar('\'', istr);
-        readText(x, istr);
-        assertChar('\'', istr);
-        assert_cast<ColumnVector<IPv> &>(column).getData().push_back(x);    /// It's important to do this at the end - for exception safety.
-    }
-    void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override
-    {
-        writeChar('"', ostr);
-        serializeText(column, row_num, ostr, settings);
-        writeChar('"', ostr);
-    }
-    void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override
-    {
-        IPv x;
-        assertChar('"', istr);
-        readText(x, istr);
-        /// this code looks weird, but we want to throw specific exception to match original behavior...
-        if (istr.eof())
-            assertChar('"', istr);
-        if (*istr.position() != '"')
-            throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName<IPv>.data());
-        istr.ignore();
+    void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+    void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
 
-        assert_cast<ColumnVector<IPv> &>(column).getData().push_back(x);
-    }
-    void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override
-    {
-        writeChar('"', ostr);
-        serializeText(column, row_num, ostr, settings);
-        writeChar('"', ostr);
-    }
-    void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override
-    {
-        IPv value;
-        readCSV(value, istr);
+    void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+    void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override;
+    bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override;
 
-        assert_cast<ColumnVector<IPv> &>(column).getData().push_back(value);
-    }
+    void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override;
+    void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override;
 
-    void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override
-    {
-        IPv x = field.get<IPv>();
-        if constexpr (std::is_same_v<IPv, IPv6>)
-            writeBinary(x, ostr);
-        else
-            writeBinaryLittleEndian(x, ostr);
-    }
-    void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override
-    {
-        IPv x;
-        if constexpr (std::is_same_v<IPv, IPv6>)
-            readBinary(x, istr);
-        else
-            readBinaryLittleEndian(x, istr);
-        field = NearestFieldType<IPv>(x);
-    }
-    void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override
-    {
-        writeBinary(assert_cast<const ColumnVector<IPv> &>(column).getData()[row_num], ostr);
-    }
-    void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override
-    {
-        IPv x;
-        readBinary(x.toUnderType(), istr);
-        assert_cast<ColumnVector<IPv> &>(column).getData().push_back(x);
-    }
-    void serializeBinaryBulk(const IColumn & column, WriteBuffer & ostr, size_t offset, size_t limit) const override
-    {
-        const typename ColumnVector<IPv>::Container & x = typeid_cast<const ColumnVector<IPv> &>(column).getData();
+    void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
+    void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
 
-        size_t size = x.size();
-
-        if (limit == 0 || offset + limit > size)
-            limit = size - offset;
-
-        if (limit)
-            ostr.write(reinterpret_cast<const char *>(&x[offset]), sizeof(IPv) * limit);
-    }
-    void deserializeBinaryBulk(IColumn & column, ReadBuffer & istr, size_t limit, double /*avg_value_size_hint*/) const override
-    {
-        typename ColumnVector<IPv>::Container & x = typeid_cast<ColumnVector<IPv> &>(column).getData();
-        size_t initial_size = x.size();
-        x.resize(initial_size + limit);
-        size_t size = istr.readBig(reinterpret_cast<char *>(&x[initial_size]), sizeof(IPv) * limit);
-        x.resize(initial_size + size / sizeof(IPv));
-    }
+    void serializeBinaryBulk(const IColumn & column, WriteBuffer & ostr, size_t offset, size_t limit) const override;
+    void deserializeBinaryBulk(IColumn & column, ReadBuffer & istr, size_t limit, double /*avg_value_size_hint*/) const override;
 };
 
 using SerializationIPv4 = SerializationIP<IPv4>;
 using SerializationIPv6 = SerializationIP<IPv6>;
diff --git a/src/DataTypes/Serializations/SerializationLowCardinality.cpp b/src/DataTypes/Serializations/SerializationLowCardinality.cpp
index 3e1cbdb00f5..9efe05042ed 100644
--- a/src/DataTypes/Serializations/SerializationLowCardinality.cpp
+++ b/src/DataTypes/Serializations/SerializationLowCardinality.cpp
@@ -700,6 +700,11 @@ void SerializationLowCardinality::deserializeTextEscaped(IColumn & column, ReadB
     deserializeImpl(column, &ISerialization::deserializeTextEscaped, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextEscaped, istr, settings);
+}
+
 void SerializationLowCardinality::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeImpl(column, row_num, &ISerialization::serializeTextQuoted, ostr, settings);
@@ -710,11 +715,21 @@ void SerializationLowCardinality::deserializeTextQuoted(IColumn & column, ReadBu
     deserializeImpl(column, &ISerialization::deserializeTextQuoted, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextQuoted, istr, settings);
+}
+
 void SerializationLowCardinality::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
 {
     deserializeImpl(column, &ISerialization::deserializeWholeText, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeWholeText, istr, settings);
+}
+
 void SerializationLowCardinality::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeImpl(column, row_num, &ISerialization::serializeTextCSV, ostr, settings);
@@ -725,6 +740,11 @@ void SerializationLowCardinality::deserializeTextCSV(IColumn & column, ReadBuffe
     deserializeImpl(column, &ISerialization::deserializeTextCSV, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextCSV, istr, settings);
+}
+
 void SerializationLowCardinality::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeImpl(column, row_num, &ISerialization::serializeText, ostr, settings);
@@ -740,6 +760,11 @@ void SerializationLowCardinality::deserializeTextJSON(IColumn & column, ReadBuff
     deserializeImpl(column, &ISerialization::deserializeTextJSON, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextJSON, istr, settings);
+}
+
 void SerializationLowCardinality::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeImpl(column, row_num, &ISerialization::serializeTextXML, ostr, settings);
@@ -750,6 +775,11 @@ void SerializationLowCardinality::deserializeTextRaw(IColumn & column, ReadBuffe
     deserializeImpl(column, &ISerialization::deserializeTextRaw, istr, settings);
 }
 
+bool SerializationLowCardinality::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextRaw, istr, settings);
+}
+
 void SerializationLowCardinality::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeImpl(column, row_num, &ISerialization::serializeTextRaw, ostr, settings);
@@ -769,7 +799,7 @@ template <typename... Params, typename... Args>
 void SerializationLowCardinality::deserializeImpl(
     IColumn & column, SerializationLowCardinality::DeserializeFunctionPtr<Params...> func, Args &&... args) const
 {
-    auto & low_cardinality_column= getColumnLowCardinality(column);
+    auto & low_cardinality_column = getColumnLowCardinality(column);
     auto temp_column = low_cardinality_column.getDictionary().getNestedColumn()->cloneEmpty();
 
     auto serialization = dictionary_type->getDefaultSerialization();
@@ -778,4 +808,19 @@ void SerializationLowCardinality::deserializeImpl(
     low_cardinality_column.insertFromFullColumn(*temp_column, 0);
 }
 
+template <typename... Params, typename... Args>
+bool SerializationLowCardinality::tryDeserializeImpl(
+    IColumn & column, SerializationLowCardinality::TryDeserializeFunctionPtr<Params...> func, Args &&... args) const
+{
+    auto & low_cardinality_column = getColumnLowCardinality(column);
+    auto temp_column = low_cardinality_column.getDictionary().getNestedColumn()->cloneEmpty();
+
+    auto serialization = dictionary_type->getDefaultSerialization();
+    if (!(serialization.get()->*func)(*temp_column, std::forward<Args>(args)...))
+        return false;
+
+    low_cardinality_column.insertFromFullColumn(*temp_column, 0);
+    return true;
+}
+
 }
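tryDeserializeImpl mirrors deserializeImpl's pointer-to-member dispatch, which is what keeps each wrapper above a single line. A self-contained sketch of the technique, using simplified stand-in types rather than the real ISerialization:

    #include <utility>

    struct Serialization
    {
        bool tryParseA(int & out, int base) const { out = 10 * base; return true; }
        bool tryParseB(int & out, int base) const { out = 20 * base; return true; }
    };

    /// Alias over the shared signature of all try-style members.
    template <typename... Params>
    using TryFn = bool (Serialization::*)(Params...) const;

    /// One generic forwarder instead of one hand-written wrapper per method.
    template <typename... Params, typename... Args>
    bool dispatch(const Serialization & s, TryFn<Params...> fn, Args &&... args)
    {
        return (s.*fn)(std::forward<Args>(args)...);   /// same call shape as (serialization.get()->*func)(...)
    }

    int main()
    {
        Serialization s;
        int v = 0;
        return dispatch(s, &Serialization::tryParseA, v, 2) && v == 20 ? 0 : 1;
    }

The only difference from deserializeImpl is the bool return threaded through, so a failed parse leaves the dictionary untouched.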
diff --git a/src/DataTypes/Serializations/SerializationLowCardinality.h b/src/DataTypes/Serializations/SerializationLowCardinality.h
index 5f56bcf8108..d2c3a95c702 100644
--- a/src/DataTypes/Serializations/SerializationLowCardinality.h
+++ b/src/DataTypes/Serializations/SerializationLowCardinality.h
@@ -55,16 +55,22 @@ public:
     void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
     void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
 
 private:
@@ -79,6 +85,12 @@ private:
     template <typename... Params, typename... Args>
     void deserializeImpl(IColumn & column, DeserializeFunctionPtr<Params...> func, Args &&... args) const;
+
+    template <typename... Params>
+    using TryDeserializeFunctionPtr = bool (ISerialization::*)(IColumn &, Params ...) const;
+
+    template <typename... Params, typename... Args>
+    bool tryDeserializeImpl(IColumn & column, TryDeserializeFunctionPtr<Params...> func, Args &&... args) const;
 };
 
 }
diff --git a/src/DataTypes/Serializations/SerializationMap.cpp b/src/DataTypes/Serializations/SerializationMap.cpp
index 7588e630689..7b6f87baf2e 100644
--- a/src/DataTypes/Serializations/SerializationMap.cpp
+++ b/src/DataTypes/Serializations/SerializationMap.cpp
@@ -115,9 +115,11 @@ void SerializationMap::serializeTextImpl(
     writeChar('}', ostr);
 }
 
-template <typename Reader>
-void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const
+template <typename ReturnType, typename Reader>
+ReturnType SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const
 {
+    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
+
     auto & column_map = assert_cast<ColumnMap &>(column);
 
     auto & nested_array = column_map.getNestedColumn();
@@ -128,7 +130,21 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr,
     auto & value_column = nested_tuple.getColumn(1);
 
     size_t size = 0;
-    assertChar('{', istr);
+    if constexpr (throw_exception)
+        assertChar('{', istr);
+    else if (!checkChar('{', istr))
+        return ReturnType(false);
+
+    auto on_error_no_throw = [&]()
+    {
+        if (size)
+        {
+            nested_tuple.getColumnPtr(0) = key_column.cut(0, offsets.back());
+            nested_tuple.getColumnPtr(1) = value_column.cut(0, offsets.back());
+        }
+
+        return ReturnType(false);
+    };
 
     try
     {
@@ -138,9 +154,15 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr,
         if (!first)
         {
             if (*istr.position() == ',')
+            {
                 ++istr.position();
+            }
             else
-                throw Exception(ErrorCodes::CANNOT_READ_MAP_FROM_TEXT, "Cannot read Map from text");
+            {
+                if constexpr (throw_exception)
+                    throw Exception(ErrorCodes::CANNOT_READ_MAP_FROM_TEXT, "Cannot read Map from text");
+                return on_error_no_throw();
+            }
         }
 
         first = false;
@@ -150,19 +172,32 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr,
             if (*istr.position() == '}')
                 break;
 
-            reader(istr, key, key_column);
+            if constexpr (throw_exception)
+                reader(istr, key, key_column);
+            else if (!reader(istr, key, key_column))
+                return on_error_no_throw();
+
             ++size;
             skipWhitespaceIfAny(istr);
-            assertChar(':', istr);
+            if constexpr (throw_exception)
+                assertChar(':', istr);
+            else if (!checkChar(':', istr))
+                return on_error_no_throw();
 
             skipWhitespaceIfAny(istr);
-            reader(istr, value, value_column);
+            if constexpr (throw_exception)
+                reader(istr, value, value_column);
+            else if (!reader(istr, value, value_column))
+                return on_error_no_throw();
 
             skipWhitespaceIfAny(istr);
         }
 
-        assertChar('}', istr);
+        if constexpr (throw_exception)
+            assertChar('}', istr);
+        else if (!checkChar('}', istr))
+            return on_error_no_throw();
     }
     catch (...)
     {
@@ -171,10 +206,14 @@
             nested_tuple.getColumnPtr(0) = key_column.cut(0, offsets.back());
             nested_tuple.getColumnPtr(1) = value_column.cut(0, offsets.back());
         }
-        throw;
+
+        if constexpr (throw_exception)
+            throw;
+        return ReturnType(false);
     }
 
     offsets.push_back(offsets.back() + size);
+    return ReturnType(true);
 }
 
 void SerializationMap::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
@@ -192,8 +231,8 @@ void SerializationMap::deserializeText(IColumn & column, ReadBuffer & istr, cons
     deserializeTextImpl(column, istr,
         [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn)
         {
-            if (settings.null_as_default)
-                SerializationNullable::deserializeTextQuotedImpl(subcolumn, buf, settings, subcolumn_serialization);
+            if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn))
+                SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(subcolumn, buf, settings, subcolumn_serialization);
             else
                 subcolumn_serialization->deserializeTextQuoted(subcolumn, buf, settings);
         });
@@ -202,6 +241,28 @@ void SerializationMap::deserializeText(IColumn & column, ReadBuffer & istr, cons
         throwUnexpectedDataAfterParsedValue(column, istr, settings, "Map");
 }
 
+bool SerializationMap::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const
+{
+    auto reader = [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn)
+    {
+        if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn))
+            return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(subcolumn, buf, settings, subcolumn_serialization);
+        return subcolumn_serialization->tryDeserializeTextQuoted(subcolumn, buf, settings);
+    };
+
+    auto ok = deserializeTextImpl<bool>(column, istr, reader);
+    if (!ok)
+        return false;
+
+    if (whole && !istr.eof())
+    {
+        column.popBack(1);
+        return false;
+    }
+
+    return true;
+}
+
 void SerializationMap::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     serializeTextImpl(column, row_num, ostr,
@@ -260,13 +321,25 @@ void SerializationMap::deserializeTextJSON(IColumn & column, ReadBuffer & istr,
     deserializeTextImpl(column, istr,
         [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn)
         {
-            if (settings.null_as_default)
-                SerializationNullable::deserializeTextJSONImpl(subcolumn, buf, settings, subcolumn_serialization);
+            if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn))
+                SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(subcolumn, buf, settings, subcolumn_serialization);
             else
                 subcolumn_serialization->deserializeTextJSON(subcolumn, buf, settings);
         });
 }
 
+bool SerializationMap::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    auto reader = [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn)
+    {
+        if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn))
+            return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(subcolumn, buf, settings, subcolumn_serialization);
+        return subcolumn_serialization->tryDeserializeTextJSON(subcolumn, buf, settings);
+    };
+
+    return deserializeTextImpl<bool>(column, istr, reader);
+}
+
 void SerializationMap::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     const auto & column_map = assert_cast<const ColumnMap &>(column);
@@ -308,6 +381,15 @@ void SerializationMap::deserializeTextCSV(IColumn & column, ReadBuffer & istr, c
     deserializeText(column, rb, settings, true);
 }
 
+bool SerializationMap::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    String s;
+    if (!tryReadCSV(s, istr, settings.csv))
+        return false;
+    ReadBufferFromString rb(s);
+    return tryDeserializeText(column, rb, settings, true);
+}
+
 void SerializationMap::enumerateStreams(
     EnumerateStreamsSettings & settings,
     const StreamCallback & callback,
diff --git a/src/DataTypes/Serializations/SerializationMap.h b/src/DataTypes/Serializations/SerializationMap.h
index f32c656757d..3e27ef1b04a 100644
--- a/src/DataTypes/Serializations/SerializationMap.h
+++ b/src/DataTypes/Serializations/SerializationMap.h
@@ -24,13 +24,16 @@ public:
     void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
     void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override;
+    bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override;
     void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
     void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override;
     void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
 
     void enumerateStreams(
         EnumerateStreamsSettings & settings,
@@ -68,8 +71,8 @@ private:
     template <typename KeyWriter, typename ValueWriter>
     void serializeTextImpl(const IColumn & column, size_t row_num, WriteBuffer & ostr, KeyWriter && key_writer, ValueWriter && value_writer) const;
 
-    template <typename Reader>
-    void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const;
+    template <typename ReturnType = void, typename Reader>
+    ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const;
 };
 
 }
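Both Map entry points funnel into one deserializeTextImpl body that is instantiated twice: with ReturnType = void (throwing) and ReturnType = bool (the try flavour). A minimal compilable sketch of that idiom, with illustrative names only:

    #include <stdexcept>
    #include <type_traits>

    /// One body, two behaviours. `return ReturnType(false);` is legal even when
    /// ReturnType is void: a functional cast to void is a valid discarded expression.
    template <typename ReturnType = void>
    ReturnType parseDigit(char c, int & out)
    {
        static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;

        if (c < '0' || c > '9')
        {
            if constexpr (throw_exception)
                throw std::invalid_argument("not a digit");
            return ReturnType(false);
        }

        out = c - '0';
        return ReturnType(true);
    }

    int main()
    {
        int v = 0;
        parseDigit('7', v);                   /// throwing flavour, ReturnType = void
        bool ok = parseDigit<bool>('x', v);   /// try flavour, reports failure instead
        return ok ? 1 : 0;
    }

Branches that only make sense for one instantiation are guarded by `if constexpr (throw_exception)`, so each instantiation compiles only its own error-handling path.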
diff --git a/src/DataTypes/Serializations/SerializationNamed.cpp b/src/DataTypes/Serializations/SerializationNamed.cpp
index ca60948ce68..1a9cbe9a37d 100644
--- a/src/DataTypes/Serializations/SerializationNamed.cpp
+++ b/src/DataTypes/Serializations/SerializationNamed.cpp
@@ -1,4 +1,5 @@
 #include <DataTypes/Serializations/SerializationNamed.h>
+#include
 
 namespace DB
 {
diff --git a/src/DataTypes/Serializations/SerializationNothing.h b/src/DataTypes/Serializations/SerializationNothing.h
index 02974d1ca76..7d1fff55b01 100644
--- a/src/DataTypes/Serializations/SerializationNothing.h
+++ b/src/DataTypes/Serializations/SerializationNothing.h
@@ -25,6 +25,7 @@ public:
     void deserializeBinary(IColumn &, ReadBuffer &, const FormatSettings &) const override { throwNoSerialization(); }
     void serializeText(const IColumn &, size_t, WriteBuffer &, const FormatSettings &) const override { throwNoSerialization(); }
     void deserializeText(IColumn &, ReadBuffer &, const FormatSettings &, bool) const override { throwNoSerialization(); }
+    bool tryDeserializeText(IColumn &, ReadBuffer &, const FormatSettings &, bool) const override { throwNoSerialization(); }
 
     /// These methods read and write zero bytes just to allow to figure out size of column.
     void serializeBinaryBulk(const IColumn & column, WriteBuffer & ostr, size_t offset, size_t limit) const override;
diff --git a/src/DataTypes/Serializations/SerializationNullable.cpp b/src/DataTypes/Serializations/SerializationNullable.cpp
index 15203bdc9fa..e7f0e61f2a5 100644
--- a/src/DataTypes/Serializations/SerializationNullable.cpp
+++ b/src/DataTypes/Serializations/SerializationNullable.cpp
@@ -187,55 +187,59 @@ void SerializationNullable::serializeBinary(const IColumn & column, size_t row_n
     nested->serializeBinary(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-/// Deserialize value into ColumnNullable.
-/// We need to insert both to nested column and to null byte map, or, in case of exception, to not insert at all.
-template <typename ReturnType = void, typename CheckForNull, typename DeserializeNested>
-requires std::same_as<ReturnType, void>
-static ReturnType
-safeDeserialize(IColumn & column, const ISerialization &, CheckForNull && check_for_null, DeserializeNested && deserialize_nested)
+template <typename ReturnType>
+ReturnType safeAppendToNullMap(ColumnNullable & column, bool is_null)
 {
-    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
-
-    if (check_for_null())
+    try
     {
-        col.insertDefault();
+        column.getNullMapData().push_back(is_null);
     }
-    else
+    catch (...)
     {
-        deserialize_nested(col.getNestedColumn());
-
-        try
-        {
-            col.getNullMapData().push_back(0);
-        }
-        catch (...)
-        {
-            col.getNestedColumn().popBack(1);
+        column.getNestedColumn().popBack(1);
+        if constexpr (std::is_same_v<ReturnType, void>)
             throw;
-        }
+        return ReturnType(false);
    }
+
+    return ReturnType(true);
 }
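safeAppendToNullMap exists because a Nullable column is physically two parallel arrays, and the second push_back can throw (for example on allocation failure) after the first already succeeded. A toy illustration of the invariant it restores; these are illustrative types, not ClickHouse's ColumnNullable:

    #include <vector>

    struct ToyNullable
    {
        std::vector<int> data;               /// nested values (default-filled where null)
        std::vector<unsigned char> null_map; /// 1 = null, 0 = value; must stay the same length as data

        void push(int value, bool is_null)
        {
            data.push_back(is_null ? 0 : value);
            try
            {
                null_map.push_back(is_null);
            }
            catch (...)
            {
                data.pop_back();   /// roll back the first insert so both arrays stay aligned
                throw;
            }
        }
    };

In the try flavour the same rollback happens, but the failure is reported as false instead of rethrown.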
 
-/// Deserialize value into non-nullable column. In case of NULL, insert default value and return false.
+/// Deserialize value into non-nullable column. In case of NULL, insert default and set is_null to true.
+/// If ReturnType is bool, return true if parsing was successful and false in case of any error.
 template <typename ReturnType = bool, typename CheckForNull, typename DeserializeNested>
-requires std::same_as<ReturnType, bool>
-static ReturnType
-safeDeserialize(IColumn & column, const ISerialization &, CheckForNull && check_for_null, DeserializeNested && deserialize_nested)
+static ReturnType deserializeImpl(IColumn & column, ReadBuffer & buf, CheckForNull && check_for_null, DeserializeNested && deserialize_nested, bool & is_null)
 {
-    bool insert_default = check_for_null();
-    if (insert_default)
+    is_null = check_for_null(buf);
+    if (is_null)
+    {
         column.insertDefault();
+    }
     else
-        deserialize_nested(column);
-    return !insert_default;
+    {
+        if constexpr (std::is_same_v<ReturnType, void>)
+            deserialize_nested(column, buf);
+        else if (!deserialize_nested(column, buf))
+            return ReturnType(false);
+    }
+
+    return ReturnType(true);
 }
 
 void SerializationNullable::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
 {
-    safeDeserialize(column, *nested,
-        [&istr] { bool is_null = false; readBinary(is_null, istr); return is_null; },
-        [this, &istr, settings] (IColumn & nested_column) { nested->deserializeBinary(nested_column, istr, settings); });
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    auto check_for_null = [](ReadBuffer & buf)
+    {
+        bool is_null_ = false;
+        readBinary(is_null_, buf);
+        return is_null_;
+    };
+    auto deserialize_nested = [this, &settings] (IColumn & nested_column, ReadBuffer & buf) { nested->deserializeBinary(nested_column, buf, settings); };
+    deserializeImpl<void>(col.getNestedColumn(), istr, check_for_null, deserialize_nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
 }
 
@@ -244,20 +248,19 @@ void SerializationNullable::serializeTextEscaped(const IColumn & column, size_t
     const ColumnNullable & col = assert_cast<const ColumnNullable &>(column);
 
     if (col.isNullAt(row_num))
-        writeString(settings.tsv.null_representation, ostr);
+        serializeNullEscaped(ostr, settings);
     else
         nested->serializeTextEscaped(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-
-void SerializationNullable::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+void SerializationNullable::serializeNullEscaped(DB::WriteBuffer & ostr, const DB::FormatSettings & settings)
 {
-    deserializeTextEscapedImpl(column, istr, settings, nested);
+    writeString(settings.tsv.null_representation, ostr);
 }
 
-void SerializationNullable::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+bool SerializationNullable::tryDeserializeNullEscaped(DB::ReadBuffer & istr, const DB::FormatSettings & settings)
 {
-    deserializeTextRawImpl(column, istr, settings, nested);
+    return checkString(settings.tsv.null_representation, istr);
 }
 
 void SerializationNullable::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
@@ -265,72 +268,73 @@ void SerializationNullable::serializeTextRaw(const IColumn & column, size_t row_
     const ColumnNullable & col = assert_cast<const ColumnNullable &>(column);
 
     if (col.isNullAt(row_num))
-        writeString(settings.tsv.null_representation, ostr);
+        serializeNullRaw(ostr, settings);
     else
         nested->serializeTextRaw(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-template <typename ReturnType>
-ReturnType SerializationNullable::deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested)
+void SerializationNullable::serializeNullRaw(DB::WriteBuffer & ostr, const DB::FormatSettings & settings)
 {
-    return deserializeTextEscapedAndRawImpl<ReturnType, false>(column, istr, settings, nested);
+    writeString(settings.tsv.null_representation, ostr);
 }
 
-template <typename ReturnType>
-ReturnType SerializationNullable::deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested)
+bool SerializationNullable::tryDeserializeNullRaw(DB::ReadBuffer & istr, const DB::FormatSettings & settings)
 {
-    return deserializeTextEscapedAndRawImpl<ReturnType, true>(column, istr, settings, nested);
+    return checkString(settings.tsv.null_representation, istr);
 }
 
 template <typename ReturnType, bool escaped>
-ReturnType SerializationNullable::deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested_serialization)
+ReturnType deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization, bool & is_null)
 {
+    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
+
     const String & null_representation = settings.tsv.null_representation;
+    auto deserialize_nested = [&nested_serialization, &settings] (IColumn & nested_column, ReadBuffer & buf_)
+    {
+        if constexpr (throw_exception)
+        {
+            if constexpr (escaped)
+                nested_serialization->deserializeTextEscaped(nested_column, buf_, settings);
+            else
+                nested_serialization->deserializeTextRaw(nested_column, buf_, settings);
+        }
+        else
+        {
+            if constexpr (escaped)
+                return nested_serialization->tryDeserializeTextEscaped(nested_column, buf_, settings);
+            else
+                return nested_serialization->tryDeserializeTextRaw(nested_column, buf_, settings);
+        }
+    };
 
     /// Some data types can deserialize absence of data (e.g. empty string), so eof is ok.
     if (istr.eof() || (!null_representation.empty() && *istr.position() != null_representation[0]))
     {
         /// This is not null, surely.
-        return safeDeserialize<ReturnType>(column, *nested_serialization,
-            [] { return false; },
-            [&nested_serialization, &istr, &settings] (IColumn & nested_column)
-            {
-                if constexpr (escaped)
-                    nested_serialization->deserializeTextEscaped(nested_column, istr, settings);
-                else
-                    nested_serialization->deserializeTextRaw(nested_column, istr, settings);
-            });
+        return deserializeImpl<ReturnType>(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null);
     }
 
     /// Check if we have enough data in buffer to check if it's a null.
     if (istr.available() > null_representation.size())
     {
-        auto check_for_null = [&istr, &null_representation]()
+        auto check_for_null = [&null_representation](ReadBuffer & buf)
         {
-            auto * pos = istr.position();
-            if (checkString(null_representation, istr) && (*istr.position() == '\t' || *istr.position() == '\n'))
+            auto * pos = buf.position();
+            if (checkString(null_representation, buf) && (*buf.position() == '\t' || *buf.position() == '\n'))
                 return true;
-            istr.position() = pos;
+            buf.position() = pos;
             return false;
        };
-        auto deserialize_nested = [&nested_serialization, &settings, &istr] (IColumn & nested_column)
-        {
-            if constexpr (escaped)
-                nested_serialization->deserializeTextEscaped(nested_column, istr, settings);
-            else
-                nested_serialization->deserializeTextRaw(nested_column, istr, settings);
-        };
-        return safeDeserialize<ReturnType>(column, *nested_serialization, check_for_null, deserialize_nested);
+        return deserializeImpl<ReturnType>(column, istr, check_for_null, deserialize_nested, is_null);
     }
 
     /// We don't have enough data in buffer to check if it's a null.
     /// Use PeekableReadBuffer to make a checkpoint before checking null
     /// representation and rollback if check was failed.
-    PeekableReadBuffer buf(istr, true);
-    auto check_for_null = [&buf, &null_representation]()
+    PeekableReadBuffer peekable_buf(istr, true);
+    auto check_for_null = [&null_representation](ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         buf.setCheckpoint();
         SCOPE_EXIT(buf.dropCheckpoint());
         if (checkString(null_representation, buf) && (buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'))
@@ -340,16 +344,18 @@
         return false;
     };
 
-    auto deserialize_nested = [&nested_serialization, &settings, &buf, &null_representation, &istr] (IColumn & nested_column)
+    auto deserialize_nested_with_check = [&deserialize_nested, &nested_serialization, &settings, &null_representation, &istr] (IColumn & nested_column, ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         auto * pos = buf.position();
-        if constexpr (escaped)
-            nested_serialization->deserializeTextEscaped(nested_column, buf, settings);
-        else
-            nested_serialization->deserializeTextRaw(nested_column, buf, settings);
+        if constexpr (throw_exception)
+            deserialize_nested(nested_column, buf);
+        else if (!deserialize_nested(nested_column, buf))
+            return ReturnType(false);
+
        /// Check that we don't have any unread data in PeekableReadBuffer own memory.
         if (likely(!buf.hasUnreadData()))
-            return;
+            return ReturnType(true);
 
         /// We have some unread data in PeekableReadBuffer own memory.
         /// It can happen only if there is a string instead of a number
         /// or if someone uses tab or LF in TSV null_representation.
         /// We also should delete incorrectly deserialized value from nested column.
         nested_column.popBack(1);
 
+        if constexpr (!throw_exception)
+            return ReturnType(false);
+
         if (null_representation.find('\t') != std::string::npos || null_representation.find('\n') != std::string::npos)
             throw DB::ParsingException(ErrorCodes::CANNOT_READ_ALL_DATA, "TSV custom null representation "
                                        "containing '\\t' or '\\n' may not work correctly for large input.");
@@ -375,7 +384,63 @@
                 istr.count(), std::string(pos, buf.position() - pos), parsed_value.str());
     };
 
-    return safeDeserialize<ReturnType>(column, *nested_serialization, check_for_null, deserialize_nested);
+    return deserializeImpl<ReturnType>(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null);
+}
+
+void SerializationNullable::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeTextEscapedAndRawImpl<void, true>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeTextEscapedAndRawImpl<bool, true>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
+bool SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    deserializeTextEscapedAndRawImpl<void, true>(nested_column, istr, settings, nested_serialization, is_null);
+    return !is_null;
+}
+
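The PeekableReadBuffer dance above handles the case where the null representation may be longer than what is currently buffered: the probe must be able to un-read bytes when it fails partway through the token. A reduced model of the checkpoint/rollback contract over an in-memory buffer; this is an analogy, not PeekableReadBuffer itself, whose extra own-memory copy is what the hasUnreadData() check above guards against:

    #include <cstddef>
    #include <string_view>

    struct CheckpointedReader
    {
        std::string_view data;
        size_t pos = 0;
        size_t checkpoint = 0;

        void setCheckpoint() { checkpoint = pos; }
        void rollbackToCheckpoint() { pos = checkpoint; }

        /// Consume `token` if present; otherwise restore the position and report failure.
        bool checkString(std::string_view token)
        {
            setCheckpoint();
            if (data.substr(pos).starts_with(token))
            {
                pos += token.size();
                return true;
            }
            rollbackToCheckpoint();
            return false;
        }
    };

The fast path earlier in the function skips all of this when istr already has more bytes available than the null token is long, probing in place and resetting buf.position() by hand.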
+bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    return deserializeTextEscapedAndRawImpl<bool, true>(nested_column, istr, settings, nested_serialization, is_null);
+}
+
+void SerializationNullable::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeTextEscapedAndRawImpl<void, false>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeTextEscapedAndRawImpl<bool, false>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
+bool SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    deserializeTextEscapedAndRawImpl<void, false>(nested_column, istr, settings, nested_serialization, is_null);
+    return !is_null;
+}
+
+bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    return deserializeTextEscapedAndRawImpl<bool, false>(nested_column, istr, settings, nested_serialization, is_null);
 }
 
 void SerializationNullable::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
@@ -383,45 +448,51 @@ void SerializationNullable::serializeTextQuoted(const IColumn & column, size_t r
     const ColumnNullable & col = assert_cast<const ColumnNullable &>(column);
 
     if (col.isNullAt(row_num))
-        writeCString("NULL", ostr);
+        serializeNullQuoted(ostr);
     else
         nested->serializeTextQuoted(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-
-void SerializationNullable::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+void SerializationNullable::serializeNullQuoted(DB::WriteBuffer & ostr)
 {
-    deserializeTextQuotedImpl(column, istr, settings, nested);
+    writeCString("NULL", ostr);
+}
+
+bool SerializationNullable::tryDeserializeNullQuoted(DB::ReadBuffer & istr)
+{
+    return checkStringCaseInsensitive("NULL", istr);
 }
 
 template <typename ReturnType>
-ReturnType SerializationNullable::deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested)
+ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null)
 {
+    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
+
+    auto deserialize_nested = [&nested, &settings] (IColumn & nested_column, ReadBuffer & buf)
+    {
+        if constexpr (!throw_exception)
+            return nested->tryDeserializeTextQuoted(nested_column, buf, settings);
+        nested->deserializeTextQuoted(nested_column, buf, settings);
+    };
+
     if (istr.eof() || (*istr.position() != 'N' && *istr.position() != 'n'))
     {
         /// This is not null, surely.
-        return safeDeserialize<ReturnType>(column, *nested,
-            [] { return false; },
-            [&nested, &istr, &settings] (IColumn & nested_column) { nested->deserializeTextQuoted(nested_column, istr, settings); });
+        return deserializeImpl<ReturnType>(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null);
     }
 
     /// Check if we have enough data in buffer to check if it's a null.
     if (istr.available() >= 4)
     {
-        auto check_for_null = [&istr]()
+        auto check_for_null = [](ReadBuffer & buf)
         {
-            auto * pos = istr.position();
-            if (checkStringCaseInsensitive("NULL", istr))
+            auto * pos = buf.position();
+            if (checkStringCaseInsensitive("NULL", buf))
                 return true;
-            istr.position() = pos;
+            buf.position() = pos;
             return false;
        };
-        auto deserialize_nested = [&nested, &settings, &istr] (IColumn & nested_column)
-        {
-            nested->deserializeTextQuoted(nested_column, istr, settings);
-        };
-        return safeDeserialize<ReturnType>(column, *nested, check_for_null, deserialize_nested);
+        return deserializeImpl<ReturnType>(column, istr, check_for_null, deserialize_nested, is_null);
     }
 
     /// We don't have enough data in buffer to check if it's a NULL
     /// and we cannot check the rest of the buffer (for example, it's impossible
     /// to differentiate for example NULL and NaN for float)
     /// Use PeekableReadBuffer to make a checkpoint before checking
     /// null and rollback if the check was failed.
-    PeekableReadBuffer buf(istr, true);
-    auto check_for_null = [&buf]()
+    PeekableReadBuffer peekable_buf(istr, true);
+    auto check_for_null = [](ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         buf.setCheckpoint();
         SCOPE_EXIT(buf.dropCheckpoint());
         if (checkStringCaseInsensitive("NULL", buf))
@@ -441,39 +513,74 @@ ReturnType SerializationNullable::deserializeTextQuotedImpl(IColumn & column, Re
         return false;
    };
 
-    auto deserialize_nested = [&nested, &settings, &buf] (IColumn & nested_column)
+    auto deserialize_nested_with_check = [&deserialize_nested] (IColumn & nested_column, ReadBuffer & buf_)
     {
-        nested->deserializeTextQuoted(nested_column, buf, settings);
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
+
+        if constexpr (throw_exception)
+            deserialize_nested(nested_column, buf);
+        else if (!deserialize_nested(nested_column, buf))
+            return false;
+
         /// Check that we don't have any unread data in PeekableReadBuffer own memory.
         if (likely(!buf.hasUnreadData()))
-            return;
+            return ReturnType(true);
 
         /// We have some unread data in PeekableReadBuffer own memory.
         /// It can happen only if there is an unquoted string instead of a number.
         /// We also should delete incorrectly deserialized value from nested column.
         nested_column.popBack(1);
+
+        if constexpr (!throw_exception)
+            return ReturnType(false);
+
         throw DB::ParsingException(
             ErrorCodes::CANNOT_READ_ALL_DATA,
             "Error while parsing Nullable: got an unquoted string {} instead of a number",
             String(buf.position(), std::min(10ul, buf.available())));
     };
 
-    return safeDeserialize<ReturnType>(column, *nested, check_for_null, deserialize_nested);
+    return deserializeImpl<ReturnType>(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null);
 }
 
-void SerializationNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+void SerializationNullable::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
 {
-    deserializeWholeTextImpl(column, istr, settings, nested);
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeTextQuotedImpl<void>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeTextQuotedImpl<bool>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
+bool SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    deserializeTextQuotedImpl<void>(nested_column, istr, settings, nested_serialization, is_null);
+    return !is_null;
+}
+
+bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    return deserializeTextQuotedImpl<bool>(nested_column, istr, settings, nested_serialization, is_null);
 }
 
 template <typename ReturnType>
-ReturnType SerializationNullable::deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested)
+ReturnType deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null)
 {
-    PeekableReadBuffer buf(istr, true);
-    auto check_for_null = [&buf]()
+    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
+
+    PeekableReadBuffer peekable_buf(istr, true);
+    auto check_for_null = [](ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         buf.setCheckpoint();
         SCOPE_EXIT(buf.dropCheckpoint());
@@ -488,15 +595,46 @@ ReturnType SerializationNullable::deserializeWholeTextImpl(IColumn & column, Rea
         return false;
    };
 
-    auto deserialize_nested = [&nested, &settings, &buf] (IColumn & nested_column)
+    auto deserialize_nested = [&nested, &settings] (IColumn & nested_column, ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
+        if constexpr (!throw_exception)
+            return nested->tryDeserializeWholeText(nested_column, buf, settings);
+
         nested->deserializeWholeText(nested_column, buf, settings);
         assert(!buf.hasUnreadData());
    };
 
-    return safeDeserialize<ReturnType>(column, *nested, check_for_null, deserialize_nested);
+    return deserializeImpl<ReturnType>(column, peekable_buf, check_for_null, deserialize_nested, is_null);
 }
 
+void SerializationNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeWholeTextImpl<void>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeWholeTextImpl<bool>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
+bool SerializationNullable::deserializeNullAsDefaultOrNestedWholeText(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    deserializeWholeTextImpl<void>(nested_column, istr, settings, nested_serialization, is_null);
+    return !is_null;
+}
+
+bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedWholeText(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    return deserializeWholeTextImpl<bool>(nested_column, istr, settings, nested_serialization, is_null);
+}
 
 void SerializationNullable::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
@@ -508,48 +646,56 @@ void SerializationNullable::serializeTextCSV(const IColumn & column, size_t row_
     nested->serializeTextCSV(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-void SerializationNullable::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+void SerializationNullable::serializeNullCSV(DB::WriteBuffer & ostr, const DB::FormatSettings & settings)
 {
-    deserializeTextCSVImpl(column, istr, settings, nested);
+    writeString(settings.csv.null_representation, ostr);
+}
+
+bool SerializationNullable::tryDeserializeNullCSV(DB::ReadBuffer & istr, const DB::FormatSettings & settings)
+{
+    return checkString(settings.csv.null_representation, istr);
 }
 
 template <typename ReturnType>
-ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested_serialization)
+ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization, bool & is_null)
 {
+    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
+
+    auto deserialize_nested = [&nested_serialization, &settings] (IColumn & nested_column, ReadBuffer & buf)
+    {
+        if constexpr (!throw_exception)
+            return nested_serialization->tryDeserializeTextCSV(nested_column, buf, settings);
+        nested_serialization->deserializeTextCSV(nested_column, buf, settings);
+    };
+
     const String & null_representation = settings.csv.null_representation;
     if (istr.eof() || (!null_representation.empty() && *istr.position() != null_representation[0]))
     {
         /// This is not null, surely.
-        return safeDeserialize<ReturnType>(column, *nested_serialization,
-            [] { return false; },
-            [&nested_serialization, &istr, &settings] (IColumn & nested_column) { nested_serialization->deserializeTextCSV(nested_column, istr, settings); });
+        return deserializeImpl<ReturnType>(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null);
     }
 
     /// Check if we have enough data in buffer to check if it's a null.
     if (settings.csv.custom_delimiter.empty() && istr.available() > null_representation.size())
     {
-        auto check_for_null = [&istr, &null_representation, &settings]()
+        auto check_for_null = [&null_representation, &settings](ReadBuffer & buf)
         {
-            auto * pos = istr.position();
-            if (checkString(null_representation, istr) && (*istr.position() == settings.csv.delimiter || *istr.position() == '\r' || *istr.position() == '\n'))
+            auto * pos = buf.position();
+            if (checkString(null_representation, buf) && (*buf.position() == settings.csv.delimiter || *buf.position() == '\r' || *buf.position() == '\n'))
                 return true;
-            istr.position() = pos;
+            buf.position() = pos;
             return false;
        };
-        auto deserialize_nested = [&nested_serialization, &settings, &istr] (IColumn & nested_column)
-        {
-            nested_serialization->deserializeTextCSV(nested_column, istr, settings);
-        };
-        return safeDeserialize<ReturnType>(column, *nested_serialization, check_for_null, deserialize_nested);
+        return deserializeImpl<ReturnType>(column, istr, check_for_null, deserialize_nested, is_null);
     }
 
     /// We don't have enough data in buffer to check if it's a null.
     /// Use PeekableReadBuffer to make a checkpoint before checking null
     /// representation and rollback if the check was failed.
-    PeekableReadBuffer buf(istr, true);
-    auto check_for_null = [&buf, &null_representation, &settings]()
+    PeekableReadBuffer peekable_buf(istr, true);
+    auto check_for_null = [&null_representation, &settings](ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         buf.setCheckpoint();
         SCOPE_EXIT(buf.dropCheckpoint());
         if (checkString(null_representation, buf))
@@ -572,13 +718,18 @@ ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadB
         return false;
    };
 
-    auto deserialize_nested = [&nested_serialization, &settings, &buf, &null_representation, &istr] (IColumn & nested_column)
+    auto deserialize_nested_with_check = [&deserialize_nested, &nested_serialization, &settings, &null_representation, &istr] (IColumn & nested_column, ReadBuffer & buf_)
     {
+        auto & buf = assert_cast<PeekableReadBuffer &>(buf_);
         auto * pos = buf.position();
-        nested_serialization->deserializeTextCSV(nested_column, buf, settings);
+        if constexpr (throw_exception)
+            deserialize_nested(nested_column, buf);
+        else if (!deserialize_nested(nested_column, buf))
+            return ReturnType(false);
+
         /// Check that we don't have any unread data in PeekableReadBuffer own memory.
         if (likely(!buf.hasUnreadData()))
-            return;
+            return ReturnType(true);
 
         /// We have some unread data in PeekableReadBuffer own memory.
         /// It can happen only if there is an unquoted string instead of a number
         /// or if someone uses csv delimiter, LF or CR in csv null representation.
         /// In the first case we cannot continue reading anyway. The second case seems to be unlikely.
         /// We also should delete incorrectly deserialized value from nested column.
         nested_column.popBack(1);
 
+        if constexpr (!throw_exception)
+            return ReturnType(false);
+
         if (null_representation.find(settings.csv.delimiter) != std::string::npos || null_representation.find('\r') != std::string::npos
             || null_representation.find('\n') != std::string::npos)
             throw DB::ParsingException(ErrorCodes::CANNOT_READ_ALL_DATA, "CSV custom null representation containing "
@@ -602,7 +756,35 @@ ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadB
             istr.count(), std::string(pos, buf.position() - pos), parsed_value.str());
     };
 
-    return safeDeserialize<ReturnType>(column, *nested_serialization, check_for_null, deserialize_nested);
+    return deserializeImpl<ReturnType>(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null);
+}
+
+void SerializationNullable::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeTextCSVImpl<void>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeTextCSVImpl<bool>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
+bool SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    deserializeTextCSVImpl<void>(nested_column, istr, settings, nested_serialization, is_null);
+    return !is_null;
+}
+
+bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization)
+{
+    bool is_null;
+    return deserializeTextCSVImpl<bool>(nested_column, istr, settings, nested_serialization, is_null);
 }
 
 void SerializationNullable::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
@@ -616,38 +798,86 @@ void SerializationNullable::serializeText(const IColumn & column, size_t row_num
 
     /// This assumes UTF-8 and proper font support. This is Ok, because Pretty formats are "presentational", not for data exchange.
     if (col.isNullAt(row_num))
-    {
-        if (settings.pretty.charset == FormatSettings::Pretty::Charset::UTF8)
-            writeCString("ᴺᵁᴸᴸ", ostr);
-        else
-            writeCString("NULL", ostr);
-    }
+        serializeNullText(ostr, settings);
     else
         nested->serializeText(col.getNestedColumn(), row_num, ostr, settings);
 }
 
+void SerializationNullable::serializeNullText(DB::WriteBuffer & ostr, const DB::FormatSettings & settings)
+{
+    if (settings.pretty.charset == FormatSettings::Pretty::Charset::UTF8)
+        writeCString("ᴺᵁᴸᴸ", ostr);
+    else
+        writeCString("NULL", ostr);
+}
+
+bool SerializationNullable::tryDeserializeNullText(DB::ReadBuffer & istr)
+{
+    if (checkCharCaseInsensitive('N', istr))
+        return checkStringCaseInsensitive("ULL", istr);
+    return checkStringCaseInsensitive("ᴺᵁᴸᴸ", istr);
+}
+
 void SerializationNullable::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
     const ColumnNullable & col = assert_cast<const ColumnNullable &>(column);
 
     if (col.isNullAt(row_num))
-        writeCString("null", ostr);
+        serializeNullJSON(ostr);
     else
         nested->serializeTextJSON(col.getNestedColumn(), row_num, ostr, settings);
 }
 
-void SerializationNullable::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+void SerializationNullable::serializeNullJSON(DB::WriteBuffer & ostr)
 {
-    deserializeTextJSONImpl(column, istr, settings, nested);
+    writeCString("null", ostr);
+}
+
+bool SerializationNullable::tryDeserializeNullJSON(DB::ReadBuffer & istr)
+{
+    return checkString("null", istr);
 }
 
 template <typename ReturnType>
-ReturnType SerializationNullable::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings,
-                                                    const SerializationPtr & nested)
+ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null)
 {
-    return safeDeserialize<ReturnType>(column, *nested,
-        [&istr] { return checkStringByFirstCharacterAndAssertTheRest("null", istr); },
-        [&nested, &istr, &settings] (IColumn & nested_column) { nested->deserializeTextJSON(nested_column, istr, settings); });
+    auto check_for_null = [](ReadBuffer & buf){ return checkStringByFirstCharacterAndAssertTheRest("null", buf); };
+    auto deserialize_nested = [&nested, &settings](IColumn & nested_column, ReadBuffer & buf)
+    {
+        if constexpr (std::is_same_v<ReturnType, bool>)
+            return nested->tryDeserializeTextJSON(nested_column, buf, settings);
+        nested->deserializeTextJSON(nested_column, buf, settings);
+    };
+
+    return deserializeImpl<ReturnType>(column, istr, check_for_null, deserialize_nested, is_null);
+}
+
+void SerializationNullable::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    deserializeTextJSONImpl<void>(col.getNestedColumn(), istr, settings, nested, is_null);
+    safeAppendToNullMap<void>(col, is_null);
+}
+
+bool SerializationNullable::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+    ColumnNullable & col = assert_cast<ColumnNullable &>(column);
+    bool is_null;
+    return deserializeTextJSONImpl<bool>(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap<bool>(col, is_null);
+}
+
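Unlike the TSV/CSV paths, the JSON impl above needs no PeekableReadBuffer: once the stream starts with 'n', the only legal token is `null`, so the probe can commit after one character and fail hard on a mismatch. A sketch of that "check by first character, assert the rest" behaviour; this is a toy over a string view, while the real helper works on a ReadBuffer:

    #include <stdexcept>
    #include <string_view>

    /// Returns true and consumes "null"; returns false without consuming anything if the
    /// first character already rules it out; throws if input starts with 'n' but is not "null".
    bool checkNullByFirstCharacterAndAssertTheRest(std::string_view & s)
    {
        if (s.empty() || s.front() != 'n')
            return false;
        if (!s.starts_with("null"))
            throw std::invalid_argument("expected 'null'");
        s.remove_prefix(4);
        return true;
    }

Because the probe never needs to back up more than one character, the JSON variant is the simplest of the deserializeText*Impl family.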
!is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextJSONImpl(nested_column, istr, settings, nested_serialization, is_null); } void SerializationNullable::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -660,11 +890,9 @@ void SerializationNullable::serializeTextXML(const IColumn & column, size_t row_ nested->serializeTextXML(col.getNestedColumn(), row_num, ostr, settings); } -template bool SerializationNullable::deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); +void SerializationNullable::serializeNullXML(DB::WriteBuffer & ostr) +{ + writeCString("\\N", ostr); +} } diff --git a/src/DataTypes/Serializations/SerializationNullable.h b/src/DataTypes/Serializations/SerializationNullable.h index 3ec01b46de5..37858ccdefd 100644 --- a/src/DataTypes/Serializations/SerializationNullable.h +++ b/src/DataTypes/Serializations/SerializationNullable.h @@ -51,9 +51,12 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -66,31 +69,49 @@ public: * In CSV, non-NULL string value, starting with \N characters, must be placed in quotes, to avoid ambiguity. 
      */
     void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;

     void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;
+    bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override;

     void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;
     void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override;

     void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+    bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
     void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;

-    /// If ReturnType is bool, check for NULL and deserialize value into non-nullable column (and return true) or insert default value of nested type (and return false)
-    /// If ReturnType is void, deserialize Nullable(T)
-    template <typename ReturnType>
-    static ReturnType deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested);
-    template <typename ReturnType>
-    static ReturnType deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested);
+    /// Check for NULL and deserialize value into non-nullable column (and return true) or insert default value of nested type (and return false).
+    static bool deserializeNullAsDefaultOrNestedWholeText(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool deserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool deserializeNullAsDefaultOrNestedTextQuoted(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization);
+    static bool deserializeNullAsDefaultOrNestedTextCSV(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool deserializeNullAsDefaultOrNestedTextJSON(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization);
+    static bool deserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+
+    /// Check for NULL and deserialize value into non-nullable column or insert default value of nested type.
+    /// Return true if parsing was successful and false in case of any error.
+    static bool tryDeserializeNullAsDefaultOrNestedWholeText(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool tryDeserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool tryDeserializeNullAsDefaultOrNestedTextQuoted(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization);
+    static bool tryDeserializeNullAsDefaultOrNestedTextCSV(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+    static bool tryDeserializeNullAsDefaultOrNestedTextJSON(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization);
+    static bool tryDeserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization);
+
+
+    static void serializeNullEscaped(WriteBuffer & ostr, const FormatSettings & settings);
+    static bool tryDeserializeNullEscaped(ReadBuffer & istr, const FormatSettings & settings);
+    static void serializeNullQuoted(WriteBuffer & ostr);
+    static bool tryDeserializeNullQuoted(ReadBuffer & istr);
+    static void serializeNullCSV(WriteBuffer & ostr, const FormatSettings & settings);
+    static bool tryDeserializeNullCSV(ReadBuffer & istr, const FormatSettings & settings);
+    static void serializeNullJSON(WriteBuffer & ostr);
+    static bool tryDeserializeNullJSON(ReadBuffer & istr);
+    static void serializeNullRaw(WriteBuffer & ostr, const FormatSettings & settings);
+    static bool tryDeserializeNullRaw(ReadBuffer & istr, const FormatSettings & settings);
+    static void serializeNullText(WriteBuffer & ostr, const FormatSettings & settings);
+    static bool tryDeserializeNullText(ReadBuffer & istr);
+    static void serializeNullXML(WriteBuffer & ostr);

 private:
     struct SubcolumnCreator : public ISubcolumnCreator
diff --git a/src/DataTypes/Serializations/SerializationNumber.cpp b/src/DataTypes/Serializations/SerializationNumber.cpp
index b6c7e4618b8..bdb4dfc6735 100644
--- a/src/DataTypes/Serializations/SerializationNumber.cpp
+++ b/src/DataTypes/Serializations/SerializationNumber.cpp
@@ -37,6 +37,18 @@ void SerializationNumber<T>::deserializeText(IColumn & column, ReadBuffer & istr
     throwUnexpectedDataAfterParsedValue(column, istr, settings, "Number");
 }

+template <typename T>
+bool SerializationNumber<T>::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const
+{
+    T x;
+
+    if (!tryReadText(x, istr) || (whole && !istr.eof()))
+        return false;
+
+    assert_cast<ColumnVector<T> &>(column).getData().push_back(x);
+    return true;
+}
+
 template <typename T>
 void SerializationNumber<T>::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
 {
@@ -44,9 +56,10 @@ void SerializationNumber<T>::serializeTextJSON(const IColumn & column, size_t ro
     writeJSONNumber(x, ostr, settings);
 }

-template <typename T>
-void SerializationNumber<T>::deserializeTextJSON(IColumn & column,
ReadBuffer & istr, const FormatSettings & settings) const +template +ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) { + static constexpr bool throw_exception = std::is_same_v; bool has_quote = false; if (!istr.eof() && *istr.position() == '"') /// We understand the number both in quotes and without. { @@ -54,13 +67,16 @@ void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & ++istr.position(); } - FieldType x; + T x; /// null if (!has_quote && !istr.eof() && *istr.position() == 'n') { ++istr.position(); - assertString("ull", istr); + if constexpr (throw_exception) + assertString("ull", istr); + else if (!checkString("ull", istr)) + return ReturnType(false); x = NaNOrZero(); } @@ -73,26 +89,62 @@ void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & { // extra conditions to parse true/false strings into 1/0 if (istr.eof()) - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + else + return false; + } + if (*istr.position() == 't' || *istr.position() == 'f') { bool tmp = false; - readBoolTextWord(tmp, istr); + if constexpr (throw_exception) + readBoolTextWord(tmp, istr); + else if (!readBoolTextWord(tmp, istr)) + return ReturnType(false); + x = tmp; } else - readText(x, istr); + { + if constexpr (throw_exception) + readText(x, istr); + else if (!tryReadText(x, istr)) + return ReturnType(false); + } } else { - readText(x, istr); + if constexpr (throw_exception) + readText(x, istr); + else if (!tryReadText(x, istr)) + return ReturnType(false); } if (has_quote) - assertChar('"', istr); + { + if constexpr (throw_exception) + assertChar('"', istr); + else if (!checkChar('"', istr)) + return ReturnType(false); + } } assert_cast &>(column).getData().push_back(x); + return ReturnType(true); +} + +template +void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + deserializeTextJSONImpl(column, istr, settings); +} + +template +bool SerializationNumber::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return deserializeTextJSONImpl(column, istr, settings); } template @@ -103,6 +155,16 @@ void SerializationNumber::deserializeTextCSV(IColumn & column, ReadBuffer & i assert_cast &>(column).getData().push_back(x); } +template +bool SerializationNumber::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & /*settings*/) const +{ + FieldType x; + if (!tryReadCSV(x, istr)) + return false; + assert_cast &>(column).getData().push_back(x); + return true; +} + template void SerializationNumber::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const { diff --git a/src/DataTypes/Serializations/SerializationNumber.h b/src/DataTypes/Serializations/SerializationNumber.h index 972c6c9a30f..9d53dc9c494 100644 --- a/src/DataTypes/Serializations/SerializationNumber.h +++ b/src/DataTypes/Serializations/SerializationNumber.h @@ -20,9 +20,12 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & 
settings) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; /** Format is platform-dependent. */ void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override; diff --git a/src/DataTypes/Serializations/SerializationString.cpp b/src/DataTypes/Serializations/SerializationString.cpp index 788ff429088..1680ec8a333 100644 --- a/src/DataTypes/Serializations/SerializationString.cpp +++ b/src/DataTypes/Serializations/SerializationString.cpp @@ -272,40 +272,67 @@ void SerializationString::serializeTextEscaped(const IColumn & column, size_t ro } -template -static inline void read(IColumn & column, Reader && reader) +template +static inline ReturnType read(IColumn & column, Reader && reader) { + static constexpr bool throw_exception = std::is_same_v; ColumnString & column_string = assert_cast(column); ColumnString::Chars & data = column_string.getChars(); ColumnString::Offsets & offsets = column_string.getOffsets(); size_t old_chars_size = data.size(); size_t old_offsets_size = offsets.size(); - try - { - reader(data); - data.push_back(0); - offsets.push_back(data.size()); - } - catch (...) + auto restore_column = [&]() { offsets.resize_assume_reserved(old_offsets_size); data.resize_assume_reserved(old_chars_size); - throw; + }; + + try + { + if constexpr (throw_exception) + { + reader(data); + } + else if (!reader(data)) + { + restore_column(); + return false; + } + + data.push_back(0); + offsets.push_back(data.size()); + return ReturnType(true); + } + catch (...) 
+ { + restore_column(); + if constexpr (throw_exception) + throw; + else + return false; } } void SerializationString::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); }); } +bool SerializationString::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); return true; }); +} void SerializationString::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); }); } +bool SerializationString::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); return true; }); +} void SerializationString::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -315,7 +342,12 @@ void SerializationString::serializeTextQuoted(const IColumn & column, size_t row void SerializationString::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readQuotedStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readQuotedStringInto(data, istr); }); +} + +bool SerializationString::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { return tryReadQuotedStringInto(data, istr); }); } @@ -329,11 +361,11 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist { if (settings.json.read_objects_as_strings && !istr.eof() && *istr.position() == '{') { - read(column, [&](ColumnString::Chars & data) { readJSONObjectPossiblyInvalid(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONObjectPossiblyInvalid(data, istr); }); } else if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') { - read(column, [&](ColumnString::Chars & data) { readJSONArrayInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONArrayInto(data, istr); }); } else if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') { @@ -342,12 +374,40 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist Float64 tmp; ReadBufferFromString buf(field); if (tryReadFloatText(tmp, buf) && buf.eof()) - read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); + read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); else throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse JSON String value here: {}", field); } else - read(column, [&](ColumnString::Chars & data) { readJSONStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONStringInto(data, istr); }); +} + +bool SerializationString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (settings.json.read_objects_as_strings && !istr.eof() && *istr.position() == '{') + return 
read(column, [&](ColumnString::Chars & data) { return readJSONObjectPossiblyInvalid(data, istr); }); + + if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') + return read(column, [&](ColumnString::Chars & data) { return readJSONArrayInto(data, istr); }); + + if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') + { + String field; + if (!tryReadJSONField(field, istr)) + return false; + + Float64 tmp; + ReadBufferFromString buf(field); + if (tryReadFloatText(tmp, buf) && buf.eof()) + { + read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); + return true; + } + + return false; + } + + return read(column, [&](ColumnString::Chars & data) { return tryReadJSONStringInto(data, istr); }); } @@ -365,7 +425,12 @@ void SerializationString::serializeTextCSV(const IColumn & column, size_t row_nu void SerializationString::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { - read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); }); + read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); }); +} + +bool SerializationString::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); return true; }); } void SerializationString::serializeTextMarkdown( diff --git a/src/DataTypes/Serializations/SerializationString.h b/src/DataTypes/Serializations/SerializationString.h index cd4cdf79c11..89ab84f0d22 100644 --- a/src/DataTypes/Serializations/SerializationString.h +++ b/src/DataTypes/Serializations/SerializationString.h @@ -18,20 +18,25 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, 
ReadBuffer & istr, const FormatSettings &) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; }; diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index cbbe97eb05c..c0b0658e6b4 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -62,15 +62,35 @@ void SerializationTuple::serializeBinary(const IColumn & column, size_t row_num, } -template -static void addElementSafe(size_t num_elems, IColumn & column, F && impl) +template +static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) { + static constexpr bool throw_exception = std::is_same_v; + /// We use the assumption that tuples of zero size do not exist. size_t old_size = column.size(); + auto restore_elements = [&]() + { + for (size_t i = 0; i < num_elems; ++i) + { + auto & element_column = extractElementColumn(column, i); + if (element_column.size() > old_size) + element_column.popBack(1); + } + }; + try { - impl(); + if constexpr (throw_exception) + { + impl(); + } + else if (!impl()) + { + restore_elements(); + return ReturnType(false); + } // Check that all columns now have the same size. size_t new_size = column.size(); @@ -81,22 +101,23 @@ static void addElementSafe(size_t num_elems, IColumn & column, F && impl) { // This is not a logical error because it may work with // user-supplied data. - throw Exception(ErrorCodes::SIZES_OF_COLUMNS_IN_TUPLE_DOESNT_MATCH, - "Cannot read a tuple because not all elements are present"); + if constexpr (throw_exception) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_IN_TUPLE_DOESNT_MATCH, + "Cannot read a tuple because not all elements are present"); + restore_elements(); + return ReturnType(false); } } } catch (...) 
{ - for (size_t i = 0; i < num_elems; ++i) - { - auto & element_column = extractElementColumn(column, i); - if (element_column.size() > old_size) - element_column.popBack(1); - } - - throw; + restore_elements(); + if constexpr (throw_exception) + throw; + return ReturnType(false); } + + return ReturnType(true); } void SerializationTuple::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -120,25 +141,51 @@ void SerializationTuple::serializeText(const IColumn & column, size_t row_num, W writeChar(')', ostr); } -void SerializationTuple::deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const +template +ReturnType SerializationTuple::deserializeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const { - const size_t size = elems.size(); - assertChar('(', istr); + static constexpr bool throw_exception = std::is_same_v; - addElementSafe(elems.size(), column, [&] + const size_t size = elems.size(); + if constexpr (throw_exception) + assertChar('(', istr); + else if (!checkChar('(', istr)) + return ReturnType(false); + + auto impl = [&]() { for (size_t i = 0; i < size; ++i) { skipWhitespaceIfAny(istr); if (i != 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); } - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(extractElementColumn(column, i), istr, settings, elems[i]); + + auto & element_column = extractElementColumn(column, i); + if constexpr (throw_exception) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(element_column, istr, settings, elems[i]); + else + elems[i]->deserializeTextQuoted(element_column, istr, settings); + } else - elems[i]->deserializeTextQuoted(extractElementColumn(column, i), istr, settings); + { + bool ok; + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + ok = SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(element_column, istr, settings, elems[i]); + else + ok = elems[i]->tryDeserializeTextQuoted(element_column, istr, settings); + + if (!ok) + return false; + } } // Special format for one element tuple (1,) @@ -150,11 +197,35 @@ void SerializationTuple::deserializeText(IColumn & column, ReadBuffer & istr, co } skipWhitespaceIfAny(istr); - assertChar(')', istr); + if constexpr (throw_exception) + assertChar(')', istr); + else if (!checkChar(')', istr)) + return ReturnType(false); if (whole && !istr.eof()) - throwUnexpectedDataAfterParsedValue(column, istr, settings, "Tuple"); - }); + { + if constexpr (throw_exception) + throwUnexpectedDataAfterParsedValue(column, istr, settings, "Tuple"); + return ReturnType(false); + } + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); +} + +void SerializationTuple::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + deserializeTextImpl(column, istr, settings, whole); +} + +bool SerializationTuple::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + return deserializeTextImpl(column, istr, settings, whole); 
} void SerializationTuple::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -239,16 +310,39 @@ void SerializationTuple::serializeTextJSONPretty(const IColumn & column, size_t } } -void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +template +ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { + static constexpr bool throw_exception = std::is_same_v; + + auto deserialize_element = [&](IColumn & element_column, size_t element_pos) + { + if constexpr (throw_exception) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(element_column, istr, settings, elems[element_pos]); + else + elems[element_pos]->deserializeTextJSON(element_column, istr, settings); + } + else + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(element_column, istr, settings, elems[element_pos]); + return elems[element_pos]->tryDeserializeTextJSON(element_column, istr, settings); + } + }; + if (settings.json.read_named_tuples_as_objects && have_explicit_names) { skipWhitespaceIfAny(istr); - assertChar('{', istr); + if constexpr (throw_exception) + assertChar('{', istr); + else if (!checkChar('{', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); - addElementSafe(elems.size(), column, [&] + auto impl = [&]() { std::vector seen_elements(elems.size(), 0); size_t processed = 0; @@ -256,18 +350,32 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr while (!istr.eof() && *istr.position() != '}') { if (!settings.json.ignore_unknown_keys_in_named_tuple && processed == elems.size()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected number of elements in named tuple. Expected no more than {} (consider enabling input_format_json_ignore_unknown_keys_in_named_tuple setting)", elems.size()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected number of elements in named tuple. 
Expected no more than {} (consider enabling input_format_json_ignore_unknown_keys_in_named_tuple setting)", elems.size()); + return ReturnType(false); + } if (processed + skipped > 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); } std::string name; - readDoubleQuotedString(name, istr); + if constexpr (throw_exception) + readDoubleQuotedString(name, istr); + else if (!tryReadDoubleQuotedString(name, istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); - assertChar(':', istr); + if constexpr (throw_exception) + assertChar(':', istr); + else if (!checkChar(':', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); const size_t element_pos = getPositionByName(name); @@ -275,36 +383,52 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr { if (settings.json.ignore_unknown_keys_in_named_tuple) { - skipJSONField(istr, name); + if constexpr (throw_exception) + skipJSONField(istr, name); + else if (!trySkipJSONField(istr, name)) + return ReturnType(false); + skipWhitespaceIfAny(istr); ++skipped; continue; } else - throw Exception(ErrorCodes::NOT_FOUND_COLUMN_IN_BLOCK, "Tuple doesn't have element with name '{}', enable setting input_format_json_ignore_unknown_keys_in_named_tuple", name); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::NOT_FOUND_COLUMN_IN_BLOCK, "Tuple doesn't have element with name '{}', enable setting input_format_json_ignore_unknown_keys_in_named_tuple", name); + return ReturnType(false); + } } seen_elements[element_pos] = 1; auto & element_column = extractElementColumn(column, element_pos); - try + if constexpr (throw_exception) { - if (settings.null_as_default) - SerializationNullable::deserializeTextJSONImpl(element_column, istr, settings, elems[element_pos]); - else - elems[element_pos]->deserializeTextJSON(element_column, istr, settings); + try + { + deserialize_element(element_column, element_pos); + } + catch (Exception & e) + { + e.addMessage("(while reading the value of nested key " + name + ")"); + throw; + } } - catch (Exception & e) + else { - e.addMessage("(while reading the value of nested key " + name + ")"); - throw; + if (!deserialize_element(element_column, element_pos)) + return ReturnType(false); } skipWhitespaceIfAny(istr); ++processed; } - assertChar('}', istr); + if constexpr (throw_exception) + assertChar('}', istr); + else if (!checkChar('}', istr)) + return ReturnType(false); /// Check if we have missing elements. if (processed != elems.size()) @@ -315,41 +439,87 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr continue; if (!settings.json.defaults_for_missing_elements_in_named_tuple) - throw Exception( - ErrorCodes::INCORRECT_DATA, - "JSON object doesn't contain tuple element {}. If you want to insert defaults in case of missing elements, " - "enable setting input_format_json_defaults_for_missing_elements_in_named_tuple", - elems[element_pos]->getElementName()); + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::INCORRECT_DATA, + "JSON object doesn't contain tuple element {}. 
If you want to insert defaults in case of missing elements, " + "enable setting input_format_json_defaults_for_missing_elements_in_named_tuple", + elems[element_pos]->getElementName()); + return ReturnType(false); + } auto & element_column = extractElementColumn(column, element_pos); element_column.insertDefault(); } } - }); + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); } else { - assertChar('[', istr); + skipWhitespaceIfAny(istr); + if constexpr (throw_exception) + assertChar('[', istr); + else if (!checkChar('[', istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); - addElementSafe(elems.size(), column, [&] + auto impl = [&]() { for (size_t i = 0; i < elems.size(); ++i) { skipWhitespaceIfAny(istr); if (i != 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); } - elems[i]->deserializeTextJSON(extractElementColumn(column, i), istr, settings); + + auto & element_column = extractElementColumn(column, i); + + if constexpr (throw_exception) + deserialize_element(element_column, i); + else if (!deserialize_element(element_column, i)) + return ReturnType(false); } skipWhitespaceIfAny(istr); - assertChar(']', istr); - }); + if constexpr (throw_exception) + assertChar(']', istr); + else if (!checkChar(']', istr)) + return ReturnType(false); + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); } } +void SerializationTuple::deserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + deserializeTextJSONImpl(column, istr, settings); +} + +bool SerializationTuple::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + return deserializeTextJSONImpl(column, istr, settings); +} + + void SerializationTuple::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeCString("", ostr); @@ -385,14 +555,48 @@ void SerializationTuple::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assertChar(settings.csv.tuple_delimiter, istr); skipWhitespaceIfAny(istr); } - if (settings.null_as_default) - SerializationNullable::deserializeTextCSVImpl(extractElementColumn(column, i), istr, settings, elems[i]); + + auto & element_column = extractElementColumn(column, i); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(element_column, istr, settings, elems[i]); else - elems[i]->deserializeTextCSV(extractElementColumn(column, i), istr, settings); + elems[i]->deserializeTextCSV(element_column, istr, settings); } }); } +bool SerializationTuple::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return addElementSafe(elems.size(), column, [&] + { + const size_t size = elems.size(); + for (size_t i = 0; i < size; ++i) + { + if (i != 0) + { + skipWhitespaceIfAny(istr); + if (!checkChar(settings.csv.tuple_delimiter, istr)) + return false; + skipWhitespaceIfAny(istr); + } + + auto & element_column = extractElementColumn(column, i); + if (settings.null_as_default && 
!isColumnNullableOrLowCardinalityNullable(element_column)) + { + if (!SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(element_column, istr, settings, elems[i])) + return false; + } + else + { + if (!elems[i]->tryDeserializeTextCSV(element_column, istr, settings)) + return false; + } + } + + return true; + }); +} + void SerializationTuple::enumerateStreams( EnumerateStreamsSettings & settings, const StreamCallback & callback, diff --git a/src/DataTypes/Serializations/SerializationTuple.h b/src/DataTypes/Serializations/SerializationTuple.h index 7325259f440..d9c63a05217 100644 --- a/src/DataTypes/Serializations/SerializationTuple.h +++ b/src/DataTypes/Serializations/SerializationTuple.h @@ -23,14 +23,17 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; /// Tuples in CSV format will be serialized as separate columns (that is, losing their nesting in the tuple). void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Each sub-column in a tuple is serialized in separate stream. 
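+      * (For example, a Tuple(UInt32, String) column is written as two element substreams, one per element.)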
*/ @@ -73,6 +76,15 @@ private: bool have_explicit_names; size_t getPositionByName(const String & name) const; + + template + ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const; + + template + ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; + + template + ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; }; } diff --git a/src/DataTypes/Serializations/SerializationUUID.cpp b/src/DataTypes/Serializations/SerializationUUID.cpp index 5cf17b4c0c8..5a7aeca67a0 100644 --- a/src/DataTypes/Serializations/SerializationUUID.cpp +++ b/src/DataTypes/Serializations/SerializationUUID.cpp @@ -25,15 +25,16 @@ void SerializationUUID::deserializeText(IColumn & column, ReadBuffer & istr, con throwUnexpectedDataAfterParsedValue(column, istr, settings, "UUID"); } -void SerializationUUID::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +bool SerializationUUID::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const { - deserializeText(column, istr, settings, false); + UUID x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + + assert_cast(column).getData().push_back(x); + return true; } -void SerializationUUID::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const -{ - serializeText(column, row_num, ostr, settings); -} void SerializationUUID::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -76,6 +77,17 @@ void SerializationUUID::deserializeTextQuoted(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(std::move(uuid)); /// It's important to do this at the end - for exception safety. 
} +bool SerializationUUID::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID uuid; + String field; + if (!checkChar('\'', istr) || !tryReadText(uuid, istr) || !checkChar('\'', istr)) + return false; + + assert_cast(column).getData().push_back(std::move(uuid)); + return true; +} + void SerializationUUID::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -92,6 +104,15 @@ void SerializationUUID::deserializeTextJSON(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(x); } +bool SerializationUUID::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID x; + if (!checkChar('"', istr) || !tryReadText(x, istr) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationUUID::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -106,6 +127,14 @@ void SerializationUUID::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(value); } +bool SerializationUUID::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID value; + if (!tryReadCSV(value, istr)) + return false; + assert_cast(column).getData().push_back(value); + return true; +} void SerializationUUID::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const { diff --git a/src/DataTypes/Serializations/SerializationUUID.h b/src/DataTypes/Serializations/SerializationUUID.h index da8c15f7279..458504f8f42 100644 --- a/src/DataTypes/Serializations/SerializationUUID.h +++ b/src/DataTypes/Serializations/SerializationUUID.h @@ -10,14 +10,16 @@ class SerializationUUID : public SimpleTextSerialization public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; - void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; - void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) 
const override; void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override; diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp new file mode 100644 index 00000000000..ebd44fd6955 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -0,0 +1,828 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; + extern const int NOT_IMPLEMENTED; + extern const int INCORRECT_DATA; +} + +void SerializationVariant::enumerateStreams( + EnumerateStreamsSettings & settings, + const StreamCallback & callback, + const SubstreamData & data) const +{ + const auto * type_variant = data.type ? &assert_cast(*data.type) : nullptr; + const auto * column_variant = data.column ? &assert_cast(*data.column) : nullptr; + + auto discriminators_serialization = std::make_shared(std::make_shared>(), "discr", false); + auto local_discriminators = column_variant ? column_variant->getLocalDiscriminatorsPtr() : nullptr; + + settings.path.push_back(Substream::VariantDiscriminators); + auto discriminators_data = SubstreamData(discriminators_serialization) + .withType(type_variant ? std::make_shared>() : nullptr) + .withColumn(column_variant ? column_variant->getLocalDiscriminatorsPtr() : nullptr) + .withSerializationInfo(data.serialization_info); + + settings.path.back().data = discriminators_data; + callback(settings.path); + settings.path.pop_back(); + + settings.path.push_back(Substream::VariantElements); + settings.path.back().data = data; + + for (size_t i = 0; i < variants.size(); ++i) + { + settings.path.back().creator = std::make_shared(local_discriminators, variant_names[i], i, column_variant ? column_variant->localDiscriminatorByGlobal(i) : i); + + auto variant_data = SubstreamData(variants[i]) + .withType(type_variant ? type_variant->getVariant(i) : nullptr) + .withColumn(column_variant ? 
column_variant->getVariantPtrByGlobalDiscriminator(i) : nullptr) + .withSerializationInfo(data.serialization_info); + + addVariantElementToPath(settings.path, i); + settings.path.back().data = variant_data; + variants[i]->enumerateStreams(settings, callback, variant_data); + settings.path.pop_back(); + } + + settings.path.pop_back(); +} + +struct SerializeBinaryBulkStateVariant : public ISerialization::SerializeBinaryBulkState +{ + std::vector states; +}; + +struct DeserializeBinaryBulkStateVariant : public ISerialization::DeserializeBinaryBulkState +{ + std::vector states; +}; + +void SerializationVariant::serializeBinaryBulkStatePrefix( + const IColumn & column, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + const ColumnVariant & col = assert_cast(column); + + auto variant_state = std::make_shared(); + variant_state->states.resize(variants.size()); + + settings.path.push_back(Substream::VariantElements); + + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkStatePrefix(col.getVariantByGlobalDiscriminator(i), settings, variant_state->states[i]); + settings.path.pop_back(); + } + + settings.path.pop_back(); + state = std::move(variant_state); +} + + +void SerializationVariant::serializeBinaryBulkStateSuffix( + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + auto * variant_state = checkAndGetState(state); + + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkStateSuffix(settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); +} + + +void SerializationVariant::deserializeBinaryBulkStatePrefix( + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state) const +{ + auto variant_state = std::make_shared(); + variant_state->states.resize(variants.size()); + + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->deserializeBinaryBulkStatePrefix(settings, variant_state->states[i]); + settings.path.pop_back(); + } + + settings.path.pop_back(); + state = std::move(variant_state); +} + + +void SerializationVariant::serializeBinaryBulkWithMultipleStreams( + const IColumn & column, + size_t offset, + size_t limit, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + const ColumnVariant & col = assert_cast(column); + if (const size_t size = col.size(); limit == 0 || offset + limit > size) + limit = size - offset; + + settings.path.push_back(Substream::VariantDiscriminators); + auto * discriminators_stream = settings.getter(settings.path); + settings.path.pop_back(); + + if (!discriminators_stream) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::serializeBinaryBulkWithMultipleStreams"); + + auto * variant_state = checkAndGetState(state); + + /// If offset = 0 and limit == col.size() or we have only NULLs, we don't need to calculate + /// offsets and limits for variants and need to just serialize whole columns. + if ((offset == 0 && limit == col.size()) || col.hasOnlyNulls()) + { + /// First, serialize discriminators. + /// If we have only NULLs or local and global discriminators are the same, just serialize the column as is. 
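+        /// (Illustration: the global discriminator of a variant is fixed by the canonical order of
+        /// variants in the Variant type, while the local one reflects the layout of this particular
+        /// column, so the two can differ between columns of the same type.)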
+ if (col.hasOnlyNulls() || col.hasGlobalVariantsOrder()) + { + SerializationNumber().serializeBinaryBulk(col.getLocalDiscriminatorsColumn(), *discriminators_stream, offset, limit); + } + /// If local and global discriminators are different, we should convert local to global before serializing (because we don't serialize the mapping). + else + { + const auto & local_discriminators = col.getLocalDiscriminators(); + for (size_t i = offset; i != offset + limit; ++i) + writeBinaryLittleEndian(col.globalDiscriminatorByLocal(local_discriminators[i]), *discriminators_stream); + } + + /// Second, serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); + return; + } + + /// If we have only one non empty variant and no NULLs, we can use the same limit offset for this variant. + if (auto non_empty_local_discr = col.getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + /// First, serialize discriminators. + /// We know that all discriminators are the same, so we just need to serialize this discriminator limit times. + auto non_empty_global_discr = col.globalDiscriminatorByLocal(*non_empty_local_discr); + for (size_t i = 0; i != limit; ++i) + writeBinaryLittleEndian(non_empty_global_discr, *discriminators_stream); + + /// Second, serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + /// For non empty variant use the same offset/limit as for whole Variant column + if (i == non_empty_global_discr) + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), offset, limit, settings, variant_state->states[i]); + /// For empty variants, use just 0/0, they won't serialize anything. + else + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); + return; + } + + /// In general case we should iterate through local discriminators in range [offset, offset + limit] to serialize global discriminators and calculate offset/limit pair for each variant. + const auto & local_discriminators = col.getLocalDiscriminators(); + const auto & offsets = col.getOffsets(); + std::vector> variant_offsets_and_limits(variants.size(), {0, 0}); + size_t end = offset + limit; + for (size_t i = offset; i < end; ++i) + { + auto global_discr = col.globalDiscriminatorByLocal(local_discriminators[i]); + writeBinaryLittleEndian(global_discr, *discriminators_stream); + + if (global_discr != ColumnVariant::NULL_DISCRIMINATOR) + { + /// If we see this discriminator for the first time, update offset + if (!variant_offsets_and_limits[global_discr].second) + variant_offsets_and_limits[global_discr].first = offsets[i]; + /// Update limit for this discriminator. + ++variant_offsets_and_limits[global_discr].second; + } + } + + /// If limit for some variant is 0, it means that we don't have its discriminator in the range. + /// Set offset to the size of column for such variants, so we won't serialize values from them. 
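+    /// (E.g. if variant 1 never appears among the serialized discriminators, its limit stays 0
+    /// and its offset is set below to the variant's full size, so no rows of it are written.)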
+ for (size_t i = 0; i != variant_offsets_and_limits.size(); ++i) + { + if (!variant_offsets_and_limits[i].second) + variant_offsets_and_limits[i].first = col.getVariantByGlobalDiscriminator(i).size(); + } + + /// Serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkWithMultipleStreams( + col.getVariantByGlobalDiscriminator(i), + variant_offsets_and_limits[i].first, + variant_offsets_and_limits[i].second, + settings, + variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); +} + + +void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const +{ + auto mutable_column = column->assumeMutable(); + ColumnVariant & col = assert_cast(*mutable_column); + /// We always serialize Variant column with global variants order, + /// so while deserialization column should be always with global variants order. + if (!col.hasGlobalVariantsOrder()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); + + /// First, deserialize new discriminators. + /// We deserialize them into a separate column to be able to use substream cache, + /// so if we also need to deserialize some of sub columns, we will read discriminators only once. + settings.path.push_back(Substream::VariantDiscriminators); + ColumnPtr discriminators; + if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) + { + discriminators = cached_discriminators; + } + else + { + auto * discriminators_stream = settings.getter(settings.path); + if (!discriminators_stream) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams"); + + discriminators = ColumnVariant::ColumnDiscriminators::create(); + SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, discriminators); + } + + settings.path.pop_back(); + + /// Iterate through new discriminators, append them to column and calculate the limit for each variant. + /// While calculating limits we can also fill offsets column (we store offsets only in memory). + const auto & discriminators_data = assert_cast(*discriminators).getData(); + auto & local_discriminators = col.getLocalDiscriminators(); + local_discriminators.reserve(local_discriminators.size() + limit); + auto & offsets = col.getOffsets(); + offsets.reserve(offsets.size() + limit); + std::vector variant_limits(variants.size(), 0); + for (size_t i = 0; i != limit; ++i) + { + ColumnVariant::Discriminator discr = discriminators_data[i]; + local_discriminators.push_back(discr); + if (discr == ColumnVariant::NULL_DISCRIMINATOR) + offsets.emplace_back(); + else + offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]++); + } + + /// Now we can deserialize variants according to their limits. 
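+    /// (E.g. new discriminators [1, NULL, 1, 0] give variant_limits = {1, 2}: one new row is
+    /// read into variant 0 and two new rows into variant 1.)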
+ auto * variant_state = checkAndGetState<DeserializeBinaryBulkStateVariant>(state);
+ settings.path.push_back(Substream::VariantElements);
+ for (size_t i = 0; i != variants.size(); ++i)
+ {
+ addVariantElementToPath(settings.path, i);
+ variants[i]->deserializeBinaryBulkWithMultipleStreams(col.getVariantPtrByLocalDiscriminator(i), variant_limits[i], settings, variant_state->states[i], cache);
+ settings.path.pop_back();
+ }
+ settings.path.pop_back();
+}
+
+void SerializationVariant::addVariantElementToPath(DB::ISerialization::SubstreamPath & path, size_t i) const
+{
+ path.push_back(Substream::VariantElement);
+ path.back().variant_element_name = variant_names[i];
+}
+
+void SerializationVariant::serializeBinary(const Field & /*field*/, WriteBuffer & /*ostr*/, const FormatSettings & /*settings*/) const
+{
+ throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinary from a field is not implemented for SerializationVariant");
+}
+
+void SerializationVariant::deserializeBinary(Field & /*field*/, ReadBuffer & /*istr*/, const FormatSettings & /*settings*/) const
+{
+ throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method deserializeBinary to a field is not implemented for SerializationVariant");
+}
+
+void SerializationVariant::serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const
+{
+ const ColumnVariant & col = assert_cast<const ColumnVariant &>(column);
+ auto global_discr = col.globalDiscriminatorAt(row_num);
+ writeBinaryLittleEndian(global_discr, ostr);
+ if (global_discr != ColumnVariant::NULL_DISCRIMINATOR)
+ variants[global_discr]->serializeBinary(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings);
+}
+
+void SerializationVariant::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const
+{
+ ColumnVariant & col = assert_cast<ColumnVariant &>(column);
+ ColumnVariant::Discriminator global_discr;
+ readBinaryLittleEndian(global_discr, istr);
+ if (global_discr == ColumnVariant::NULL_DISCRIMINATOR)
+ {
+ col.insertDefault();
+ }
+ else
+ {
+ auto & variant_column = col.getVariantByGlobalDiscriminator(global_discr);
+ variants[global_discr]->deserializeBinary(variant_column, istr, settings);
+ col.getLocalDiscriminators().push_back(col.localDiscriminatorByGlobal(global_discr));
+ col.getOffsets().push_back(variant_column.size() - 1);
+ }
+}
+
+namespace
+{
+
+std::unordered_map<TypeIndex, size_t> getTypesTextDeserializePriorityMap()
+{
+ static const std::vector<TypeIndex> priorities = {
+ /// Complex types have the highest priority.
+ TypeIndex::Array,
+ TypeIndex::Tuple,
+ TypeIndex::Map,
+ TypeIndex::AggregateFunction,
+
+ /// Enums can be parsed both from strings and numbers.
+ /// So they have high enough priority.
+ TypeIndex::Enum8,
+ TypeIndex::Enum16,
+
+ /// Types that can be parsed from strings.
+ TypeIndex::UUID,
+ TypeIndex::IPv4,
+ TypeIndex::IPv6,
+
+ /// Types that can be parsed from numbers.
+ /// The order:
+ /// 1) Integers
+ /// 2) Big Integers
+ /// 3) Decimals
+ /// 4) Floats
+ /// In each group smaller types have higher priority.
+ TypeIndex::Int8,
+ TypeIndex::UInt8,
+ TypeIndex::Int16,
+ TypeIndex::UInt16,
+ TypeIndex::Int32,
+ TypeIndex::UInt32,
+ TypeIndex::Int64,
+ TypeIndex::UInt64,
+ TypeIndex::Int128,
+ TypeIndex::UInt128,
+ TypeIndex::Int256,
+ TypeIndex::UInt256,
+ TypeIndex::Decimal32,
+ TypeIndex::Decimal64,
+ TypeIndex::Decimal128,
+ TypeIndex::Decimal256,
+ TypeIndex::Float32,
+ TypeIndex::Float64,
+
+ /// Dates and DateTimes. Simpler Date types have higher priority.
+ /// They have lower priority than numbers, because some DateTimes can sometimes
+ /// also be parsed from numbers, and we usually don't want that.
+ TypeIndex::Date,
+ TypeIndex::Date32,
+ TypeIndex::DateTime,
+ TypeIndex::DateTime64,
+
+ /// String types have almost the lowest priority,
+ /// as in text formats almost all data can
+ /// be deserialized into the String type.
+ TypeIndex::FixedString,
+ TypeIndex::String,
+ };
+
+ std::unordered_map<TypeIndex, size_t> priority_map;
+ priority_map.reserve(priorities.size());
+ for (size_t i = 0; i != priorities.size(); ++i)
+ priority_map[priorities[i]] = priorities.size() - i;
+ return priority_map;
+}
+
+/// We want to create a more or less optimal order of types in which we will try text deserializations.
+/// To do it, for each type we calculate a priority and then sort the types by this priority.
+/// Above we defined the priority of each data type, but types can be nested, and we can also have LowCardinality and Nullable.
+/// To sort arbitrarily nested types we create a priority that is a tuple of 3 elements:
+/// 1) The maximum depth of nested types like Array/Map/Tuple.
+/// 2) The combination of simple and complex type priorities.
+/// 3) The nesting depth of LowCardinality/Nullable types.
+/// So, when we sort types, we first sort by the maximum depth of nested types, so more nested types are deserialized first;
+/// then, for types with the same depth, we sort by the type priority; and finally we sort by the depth of LowCardinality/Nullable types,
+/// so if we have types with the same level of nesting and the same priority, we will first try to deserialize the LowCardinality/Nullable ones
+/// (for example, if we have the types Array(Array(String)) and Array(Array(Nullable(String)))).
+/// This is just a set of heuristics.
+std::tuple<size_t, size_t, size_t> getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map<TypeIndex, size_t> & priority_map)
+{
+ if (const auto * nullable_type = typeid_cast<const DataTypeNullable *>(type.get()))
+ return getTypeTextDeserializePriority(nullable_type->getNestedType(), nested_depth, simple_nested_depth + 1, priority_map);
+
+ if (const auto * lc_type = typeid_cast<const DataTypeLowCardinality *>(type.get()))
+ return getTypeTextDeserializePriority(lc_type->getDictionaryType(), nested_depth, simple_nested_depth + 1, priority_map);
+
+ if (const auto * array_type = typeid_cast<const DataTypeArray *>(type.get()))
+ {
+ auto [elements_nested_depth, elements_priority, elements_simple_nested_depth] = getTypeTextDeserializePriority(array_type->getNestedType(), nested_depth + 1, simple_nested_depth, priority_map);
+ return {elements_nested_depth, elements_priority + priority_map[TypeIndex::Array], elements_simple_nested_depth};
+ }
+
+ if (const auto * tuple_type = typeid_cast<const DataTypeTuple *>(type.get()))
+ {
+ size_t max_nested_depth = 0;
+ size_t sum_priority = 0;
+ size_t max_simple_nested_depth = 0;
+ for (const auto & elem : tuple_type->getElements())
+ {
+ auto [elem_nested_depth, elem_priority, elem_simple_nested_depth] = getTypeTextDeserializePriority(elem, nested_depth + 1, simple_nested_depth, priority_map);
+ sum_priority += elem_priority;
+ if (elem_nested_depth > max_nested_depth)
+ max_nested_depth = elem_nested_depth;
+ if (elem_simple_nested_depth > max_simple_nested_depth)
+ max_simple_nested_depth = elem_simple_nested_depth;
+ }
+
+ return {max_nested_depth, sum_priority + priority_map[TypeIndex::Tuple], max_simple_nested_depth};
+ }
+
+ if (const auto * map_type = typeid_cast<const DataTypeMap *>(type.get()))
+ {
+ auto [key_max_depth, key_priority, key_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getKeyType(), nested_depth + 1, simple_nested_depth, priority_map);
+ auto [value_max_depth, value_priority, value_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getValueType(), nested_depth + 1, simple_nested_depth, priority_map);
+ return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map[TypeIndex::Map], std::max(key_simple_nested_depth, value_simple_nested_depth)};
+ }
+
+ if (const auto * variant_type = typeid_cast<const DataTypeVariant *>(type.get()))
+ {
+ size_t max_priority = 0;
+ size_t max_depth = 0;
+ size_t max_simple_nested_depth = 0;
+ for (const auto & variant : variant_type->getVariants())
+ {
+ auto [variant_max_depth, variant_priority, variant_simple_nested_depth] = getTypeTextDeserializePriority(variant, nested_depth, simple_nested_depth, priority_map);
+ if (variant_priority > max_priority)
+ max_priority = variant_priority;
+ if (variant_max_depth > max_depth)
+ max_depth = variant_max_depth;
+ if (variant_simple_nested_depth > max_simple_nested_depth)
+ max_simple_nested_depth = variant_simple_nested_depth;
+ }
+
+ return {max_depth, max_priority, max_simple_nested_depth};
+ }
+
+ return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth};
+}
+
+}
+
+std::vector<size_t> SerializationVariant::getVariantsDeserializeTextOrder(const DB::DataTypes & variant_types)
+{
+ std::vector<std::tuple<size_t, size_t, size_t>> priorities;
+ priorities.reserve(variant_types.size());
+ std::vector<size_t> order;
+ order.reserve(variant_types.size());
+ auto priority_map = getTypesTextDeserializePriorityMap();
+ for (size_t i = 0; i != variant_types.size(); ++i)
+ {
+ priorities.push_back(getTypeTextDeserializePriority(variant_types[i], 0, 0, priority_map));
+ order.push_back(i);
+ }
+
+ std::sort(order.begin(), order.end(), [&](size_t left, size_t right) { return priorities[left] > priorities[right]; });
+ return order;
+}
+
+
+bool SerializationVariant::tryDeserializeImpl(
+ IColumn & column,
+ const String & field,
+ std::function<bool(ReadBuffer &)> check_for_null,
+ std::function<bool(IColumn &, const SerializationPtr &, ReadBuffer &)> try_deserialize_variant) const
+{
+ auto & column_variant = assert_cast<ColumnVariant &>(column);
+ ReadBufferFromString null_buf(field);
+ if (check_for_null(null_buf) && null_buf.eof())
+ {
+ column_variant.insertDefault();
+ return true;
+ }
+
+ for (size_t global_discr : deserialize_text_order)
+ {
+ ReadBufferFromString variant_buf(field);
+ /// Usually try_deserialize_variant should not throw an exception, but let's use try/catch just in case.
+ try
+ {
+ auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr);
+ size_t prev_size = variant_column.size();
+ if (try_deserialize_variant(variant_column, variants[global_discr], variant_buf) && variant_buf.eof())
+ {
+ column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr));
+ column_variant.getOffsets().push_back(prev_size);
+ return true;
+ }
+ else if (variant_column.size() > prev_size)
+ {
+ variant_column.popBack(1);
+ }
+ }
+ catch (...)
+ {
+ /// Try the next variant.
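+ /// For example, for Variant(String, UInt64) the field "abc" fails to parse as UInt64
+ /// (which is tried first, as numbers have higher priority than strings in
+ /// getTypesTextDeserializePriorityMap above) and is parsed as String on the next iteration.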
+ } + } + + return false; +} + +void SerializationVariant::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullEscaped(ostr, settings); + else + variants[global_discr]->serializeTextEscaped(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readEscapedString(field, istr); + return tryDeserializeTextEscapedImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readEscapedString(field, istr); + if (!tryDeserializeTextEscapedImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse escaped value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextEscapedImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullEscaped(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextEscaped(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullRaw(ostr, settings); + else + variants[global_discr]->serializeTextRaw(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readString(field, istr); + return tryDeserializeTextRawImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readString(field, istr); + if (!tryDeserializeTextRawImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse raw value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextRawImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullRaw(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextRaw(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextQuoted(const IColumn & column, size_t row_num, 
WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullQuoted(ostr); + else + variants[global_discr]->serializeTextQuoted(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + if (!tryReadQuotedField(field, istr)) + return false; + return tryDeserializeTextQuotedImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readQuotedField(field, istr); + if (!tryDeserializeTextQuotedImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse quoted value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextQuotedImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullQuoted(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextQuoted(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullCSV(ostr, settings); + else + variants[global_discr]->serializeTextCSV(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readCSVStringInto(field, istr, settings.csv); + return tryDeserializeTextCSVImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readCSVField(field, istr, settings.csv); + if (!tryDeserializeTextCSVImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse CSV value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextCSVImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullCSV(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextCSV(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = 
assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullText(ostr, settings); + else + variants[global_discr]->serializeText(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readStringUntilEOF(field, istr); + return tryDeserializeWholeTextImpl(column, field, settings); +} + +void SerializationVariant::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readStringUntilEOF(field, istr); + if (!tryDeserializeWholeTextImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse text value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeWholeTextImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullText(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeWholeText(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullJSON(ostr); + else + variants[global_discr]->serializeTextJSON(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + if (!tryReadJSONField(field, istr)) + return false; + return tryDeserializeTextJSONImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readJSONField(field, istr); + if (!tryDeserializeTextJSONImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse JSON value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextJSONImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullJSON(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextJSON(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + 
SerializationNullable::serializeNullXML(ostr);
+ else
+ variants[global_discr]->serializeTextXML(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings);
+}
+
+}
diff --git a/src/DataTypes/Serializations/SerializationVariant.h b/src/DataTypes/Serializations/SerializationVariant.h
new file mode 100644
index 00000000000..b6bee94c65f
--- /dev/null
+++ b/src/DataTypes/Serializations/SerializationVariant.h
@@ -0,0 +1,116 @@
+#pragma once
+
+#include
+#include
+
+namespace DB
+{
+
+class SerializationVariant : public ISerialization
+{
+public:
+ using VariantSerializations = std::vector<SerializationPtr>;
+
+ explicit SerializationVariant(
+ const VariantSerializations & variants_,
+ const std::vector<String> & variant_names_,
+ const std::vector<size_t> & deserialize_text_order_,
+ const String & variant_name_)
+ : variants(variants_), variant_names(variant_names_), deserialize_text_order(deserialize_text_order_), variant_name(variant_name_)
+ {
+ }
+
+ void enumerateStreams(
+ EnumerateStreamsSettings & settings,
+ const StreamCallback & callback,
+ const SubstreamData & data) const override;
+
+ void serializeBinaryBulkStatePrefix(
+ const IColumn & column,
+ SerializeBinaryBulkSettings & settings,
+ SerializeBinaryBulkStatePtr & state) const override;
+
+ void serializeBinaryBulkStateSuffix(
+ SerializeBinaryBulkSettings & settings,
+ SerializeBinaryBulkStatePtr & state) const override;
+
+ void deserializeBinaryBulkStatePrefix(
+ DeserializeBinaryBulkSettings & settings,
+ DeserializeBinaryBulkStatePtr & state) const override;
+
+ void serializeBinaryBulkWithMultipleStreams(
+ const IColumn & column,
+ size_t offset,
+ size_t limit,
+ SerializeBinaryBulkSettings & settings,
+ SerializeBinaryBulkStatePtr & state) const override;
+
+ void deserializeBinaryBulkWithMultipleStreams(
+ ColumnPtr & column,
+ size_t limit,
+ DeserializeBinaryBulkSettings & settings,
+ DeserializeBinaryBulkStatePtr & state,
+ SubstreamsCache * cache) const override;
+
+ void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ 
void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+ void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+ bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override;
+
+ void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override;
+
+ /// Determine the order in which we should try to deserialize variants.
+ /// In some cases the text representation of a value can be deserialized
+ /// into several types (for example, almost all text values can be deserialized
+ /// into the String type), so we use some heuristics to determine a more optimal order.
+ static std::vector<size_t> getVariantsDeserializeTextOrder(const DataTypes & variant_types);
+
+private:
+ void addVariantElementToPath(SubstreamPath & path, size_t i) const;
+
+ bool tryDeserializeTextEscapedImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+ bool tryDeserializeTextQuotedImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+ bool tryDeserializeWholeTextImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+ bool tryDeserializeTextCSVImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+ bool tryDeserializeTextJSONImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+ bool tryDeserializeTextRawImpl(IColumn & column, const String & field, const FormatSettings & settings) const;
+
+ bool tryDeserializeImpl(
+ IColumn & column,
+ const String & field,
+ std::function<bool(ReadBuffer &)> check_for_null,
+ std::function<bool(IColumn &, const SerializationPtr &, ReadBuffer &)> try_deserialize_nested) const;
+
+ VariantSerializations variants;
+ std::vector<String> variant_names;
+ std::vector<size_t> deserialize_text_order;
+ /// Name of the Variant data type for better exception messages.
+ String variant_name;
+};
+
+}
diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
new file mode 100644
index 00000000000..4b24ee5754e
--- /dev/null
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -0,0 +1,241 @@
+#include
+#include
+#include
+#include
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+ extern const int NOT_IMPLEMENTED;
+ extern const int LOGICAL_ERROR;
+}
+
+void SerializationVariantElement::enumerateStreams(
+ DB::ISerialization::EnumerateStreamsSettings & settings,
+ const DB::ISerialization::StreamCallback & callback,
+ const DB::ISerialization::SubstreamData & data) const
+{
+ /// We will need the discriminators stream during deserialization.
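+ /// For example, reading the subcolumn `v.UInt64` of a column `v Variant(String, UInt64)`
+ /// requires the shared discriminators stream as well as the streams of the UInt64 variant itself.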
+ settings.path.push_back(Substream::VariantDiscriminators);
+ callback(settings.path);
+ settings.path.pop_back();
+
+ addVariantToPath(settings.path);
+ settings.path.back().data = data;
+ nested_serialization->enumerateStreams(settings, callback, data);
+ removeVariantFromPath(settings.path);
+}
+
+void SerializationVariantElement::serializeBinaryBulkStatePrefix(const IColumn &, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const
+{
+ throw Exception(
+ ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkStatePrefix is not implemented for SerializationVariantElement");
+}
+
+void SerializationVariantElement::serializeBinaryBulkStateSuffix(SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const
+{
+ throw Exception(
+ ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkStateSuffix is not implemented for SerializationVariantElement");
+}
+
+void SerializationVariantElement::deserializeBinaryBulkStatePrefix(DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state) const
+{
+ addVariantToPath(settings.path);
+ nested_serialization->deserializeBinaryBulkStatePrefix(settings, state);
+ removeVariantFromPath(settings.path);
+}
+
+void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const IColumn &, size_t, size_t, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const
+{
+ throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkWithMultipleStreams is not implemented for SerializationVariantElement");
+}
+
+void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
+ ColumnPtr & column,
+ size_t limit,
+ DeserializeBinaryBulkSettings & settings,
+ DeserializeBinaryBulkStatePtr & state,
+ SubstreamsCache * cache) const
+{
+ auto mutable_column = column->assumeMutable();
+ ColumnNullable * nullable_col = typeid_cast<ColumnNullable *>(mutable_column.get());
+ NullMap * null_map = nullable_col ? &nullable_col->getNullMapData() : nullptr;
+
+ /// First, deserialize discriminators from the Variant column.
+ settings.path.push_back(Substream::VariantDiscriminators);
+ ColumnPtr discriminators;
+ if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path))
+ {
+ discriminators = cached_discriminators;
+ }
+ else
+ {
+ auto * discriminators_stream = settings.getter(settings.path);
+ if (!discriminators_stream)
+ throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams");
+
+ discriminators = ColumnVariant::ColumnDiscriminators::create();
+ SerializationNumber<ColumnVariant::Discriminator>().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0);
+ addToSubstreamsCache(cache, settings.path, discriminators);
+ }
+ settings.path.pop_back();
+
+ /// Iterate through the discriminators to calculate the size of the variant.
+ const auto & discriminators_data = assert_cast<const ColumnVariant::ColumnDiscriminators &>(*discriminators).getData();
+ size_t variant_size = 0;
+ for (auto discr : discriminators_data)
+ variant_size += discr == variant_discriminator;
+
+ /// Now we know the size of the variant and can deserialize it.
+
+ /// If the size of the variant is the same as the size of the discriminators, then all rows
+ /// in the range contain this variant and we can deserialize new values directly into our column.
+ if (variant_size == discriminators_data.size())
+ {
+ addVariantToPath(settings.path);
+ /// Special case when our result column is LowCardinality(Nullable(T)).
+ /// In this case the variant type is LowCardinality(T), and we cannot just
+ /// deserialize its values directly into a LowCardinality(Nullable(T)) column.
+ /// We create a separate column with type LowCardinality(T), deserialize
+ /// values into it and then insert them into the result column using insertRangeFrom.
+ if (isColumnLowCardinalityNullable(*column))
+ {
+ ColumnPtr variant_col = mutable_column->cloneEmpty();
+ /// LowCardinality(Nullable(T)) -> LowCardinality(T)
+ assert_cast<ColumnLowCardinality &>(*variant_col->assumeMutable()).nestedRemoveNullable();
+ nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, limit, settings, state, cache);
+ mutable_column->insertRangeFrom(*variant_col, 0, variant_col->size());
+ }
+ else
+ {
+ nested_serialization->deserializeBinaryBulkWithMultipleStreams(nullable_col ? nullable_col->getNestedColumnPtr() : column, limit, settings, state, cache);
+ }
+ if (nullable_col)
+ null_map->resize_fill(null_map->size() + limit, 0);
+ removeVariantFromPath(settings.path);
+ return;
+ }
+
+ /// If the variant size is 0, just fill the column with default values.
+ if (variant_size == 0)
+ {
+ mutable_column->insertManyDefaults(limit);
+ return;
+ }
+
+ /// In the general case we should deserialize the variant into a separate column,
+ /// iterate through the discriminators and insert values from the variant only for
+ /// rows that contain its discriminator, inserting default values otherwise.
+ mutable_column->reserve(mutable_column->size() + limit);
+ mutable_column = nullable_col ? nullable_col->getNestedColumnPtr()->assumeMutable() : std::move(mutable_column);
+ ColumnPtr variant_col = mutable_column->cloneEmpty();
+
+ /// Special case when our result column is LowCardinality(Nullable(T)).
+ /// We should remove Nullable from the variant column before deserialization.
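+ /// For example, if the discriminators are [d, x, d] (where d is our variant's discriminator)
+ /// and the deserialized variant holds values [a, b], the result column becomes [a, <default>, b]
+ /// with null-map [0, 1, 0] when the result column is nullable.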
+ if (isColumnLowCardinalityNullable(*column))
+ assert_cast<ColumnLowCardinality &>(*variant_col->assumeMutable()).nestedRemoveNullable();
+
+ addVariantToPath(settings.path);
+ nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, variant_size, settings, state, cache);
+ removeVariantFromPath(settings.path);
+
+ size_t variant_index = 0;
+ for (auto discr : discriminators_data)
+ {
+ if (discr == variant_discriminator)
+ {
+ if (null_map)
+ null_map->push_back(0);
+ mutable_column->insertFrom(*variant_col, variant_index++);
+ }
+ else
+ {
+ if (null_map)
+ null_map->push_back(1);
+ mutable_column->insertDefault();
+ }
+ }
+}
+
+void SerializationVariantElement::addVariantToPath(DB::ISerialization::SubstreamPath & path) const
+{
+ path.push_back(Substream::VariantElements);
+ path.push_back(Substream::VariantElement);
+ path.back().variant_element_name = variant_element_name;
+}
+
+void SerializationVariantElement::removeVariantFromPath(DB::ISerialization::SubstreamPath & path) const
+{
+ path.pop_back();
+ path.pop_back();
+}
+
+SerializationVariantElement::VariantSubcolumnCreator::VariantSubcolumnCreator(
+ const DB::ColumnPtr & local_discriminators_,
+ const DB::String & variant_element_name_,
+ const ColumnVariant::Discriminator global_variant_discriminator_,
+ const ColumnVariant::Discriminator local_variant_discriminator_)
+ : local_discriminators(local_discriminators_)
+ , variant_element_name(variant_element_name_)
+ , global_variant_discriminator(global_variant_discriminator_)
+ , local_variant_discriminator(local_variant_discriminator_)
+{
+}
+
+DataTypePtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::DataTypePtr & prev) const
+{
+ return makeNullableOrLowCardinalityNullableSafe(prev);
+}
+
+SerializationPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::SerializationPtr & prev) const
+{
+ return std::make_shared<SerializationVariantElement>(prev, variant_element_name, global_variant_discriminator);
+}
+
+ColumnPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::ColumnPtr & prev) const
+{
+ /// Case when the original Variant column contained only one non-empty variant and no NULLs.
+ /// In this case just use this variant.
+ if (prev->size() == local_discriminators->size())
+ return makeNullableOrLowCardinalityNullableSafe(prev);
+
+ /// If this variant is empty, fill the result column with default values.
+ if (prev->empty())
+ {
+ auto res = IColumn::mutate(makeNullableOrLowCardinalityNullableSafe(prev));
+ res->insertManyDefaults(local_discriminators->size());
+ return res;
+ }
+
+ /// In the general case we should iterate through the discriminators and create a null-map for our variant.
+ NullMap null_map;
+ null_map.reserve(local_discriminators->size());
+ const auto & local_discriminators_data = assert_cast<const ColumnVariant::ColumnDiscriminators &>(*local_discriminators).getData();
+ for (auto local_discr : local_discriminators_data)
+ null_map.push_back(local_discr != local_variant_discriminator);
+
+ /// Now we can create a new column from the null-map and the variant column using IColumn::expand.
+ auto res_column = IColumn::mutate(prev);
+
+ /// Special case for LowCardinality. We want the result to be LowCardinality(Nullable),
+ /// but we don't have a good way to apply a null-mask for LowCardinality(), so, we first
+ /// convert our column to LowCardinality(Nullable()) and then use expand which will
+ /// fill rows with 0 in mask with default value (that is NULL).
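+ /// For example, for local discriminators [d, x, d] (where d is our local discriminator) the
+ /// null-map is [0, 1, 0]; expanding the variant values [a, b] with the inverted mask gives
+ /// [a, <default>, b], and attaching the null-map yields the final Nullable column (a, NULL, b).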
+ if (prev->lowCardinality()) + res_column = assert_cast(*res_column).cloneNullable(); + + res_column->expand(null_map, /*inverted = */ true); + + if (res_column->canBeInsideNullable()) + { + auto null_map_col = ColumnUInt8::create(); + null_map_col->getData() = std::move(null_map); + return ColumnNullable::create(std::move(res_column), std::move(null_map_col)); + } + + return res_column; +} + +} diff --git a/src/DataTypes/Serializations/SerializationVariantElement.h b/src/DataTypes/Serializations/SerializationVariantElement.h new file mode 100644 index 00000000000..c343c219cf3 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariantElement.h @@ -0,0 +1,87 @@ +#pragma once + +#include +#include +#include +#include + +namespace DB +{ + +class SerializationVariant; + +/// Serialization for Variant element when we read it as a subcolumn. +class SerializationVariantElement final : public SerializationWrapper +{ +private: + /// To be able to deserialize Variant element as a subcolumn + /// we need its type name and global discriminator. + String variant_element_name; + ColumnVariant::Discriminator variant_discriminator; + +public: + SerializationVariantElement(const SerializationPtr & nested_, const String & variant_element_name_, ColumnVariant::Discriminator variant_discriminator_) + : SerializationWrapper(nested_) + , variant_element_name(variant_element_name_) + , variant_discriminator(variant_discriminator_) + { + } + + void enumerateStreams( + EnumerateStreamsSettings & settings, + const StreamCallback & callback, + const SubstreamData & data) const override; + + void serializeBinaryBulkStatePrefix( + const IColumn & column, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkStateSuffix( + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkStatePrefix( + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkWithMultipleStreams( + const IColumn & column, + size_t offset, + size_t limit, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const override; + +private: + friend SerializationVariant; + + void addVariantToPath(SubstreamPath & path) const; + void removeVariantFromPath(SubstreamPath & path) const; + + struct VariantSubcolumnCreator : public ISubcolumnCreator + { + const ColumnPtr local_discriminators; + const String variant_element_name; + const ColumnVariant::Discriminator global_variant_discriminator; + const ColumnVariant::Discriminator local_variant_discriminator; + + VariantSubcolumnCreator( + const ColumnPtr & local_discriminators_, + const String & variant_element_name_, + const ColumnVariant::Discriminator global_variant_discriminator_, + const ColumnVariant::Discriminator local_variant_discriminator_); + + DataTypePtr create(const DataTypePtr & prev) const override; + ColumnPtr create(const ColumnPtr & prev) const override; + SerializationPtr create(const SerializationPtr & prev) const override; + }; +}; + +} diff --git a/src/DataTypes/Serializations/SerializationWrapper.cpp b/src/DataTypes/Serializations/SerializationWrapper.cpp index 18e4891ee65..bde52bb8096 100644 --- 
a/src/DataTypes/Serializations/SerializationWrapper.cpp +++ b/src/DataTypes/Serializations/SerializationWrapper.cpp @@ -96,6 +96,11 @@ void SerializationWrapper::deserializeTextEscaped(IColumn & column, ReadBuffer & nested_serialization->deserializeTextEscaped(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextEscaped(column, istr, settings); +} + void SerializationWrapper::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextQuoted(column, row_num, ostr, settings); @@ -106,6 +111,11 @@ void SerializationWrapper::deserializeTextQuoted(IColumn & column, ReadBuffer & nested_serialization->deserializeTextQuoted(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextQuoted(column, istr, settings); +} + void SerializationWrapper::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextCSV(column, row_num, ostr, settings); @@ -116,6 +126,11 @@ void SerializationWrapper::deserializeTextCSV(IColumn & column, ReadBuffer & ist nested_serialization->deserializeTextCSV(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextCSV(column, istr, settings); +} + void SerializationWrapper::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeText(column, row_num, ostr, settings); @@ -126,6 +141,11 @@ void SerializationWrapper::deserializeWholeText(IColumn & column, ReadBuffer & i nested_serialization->deserializeWholeText(column, istr, settings); } +bool SerializationWrapper::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeWholeText(column, istr, settings); +} + void SerializationWrapper::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextJSON(column, row_num, ostr, settings); @@ -136,6 +156,11 @@ void SerializationWrapper::deserializeTextJSON(IColumn & column, ReadBuffer & is nested_serialization->deserializeTextJSON(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextJSON(column, istr, settings); +} + void SerializationWrapper::serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const { nested_serialization->serializeTextJSONPretty(column, row_num, ostr, settings, indent); diff --git a/src/DataTypes/Serializations/SerializationWrapper.h b/src/DataTypes/Serializations/SerializationWrapper.h index 31900f93148..6c5e2046062 100644 --- a/src/DataTypes/Serializations/SerializationWrapper.h +++ b/src/DataTypes/Serializations/SerializationWrapper.h @@ -63,18 +63,23 @@ public: void serializeTextEscaped(const IColumn & column, size_t row_num, 
WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; diff --git a/src/DataTypes/Serializations/SimpleTextSerialization.h b/src/DataTypes/Serializations/SimpleTextSerialization.h index 0247f30b30a..11f56de73d1 100644 --- a/src/DataTypes/Serializations/SimpleTextSerialization.h +++ b/src/DataTypes/Serializations/SimpleTextSerialization.h @@ -36,29 +36,67 @@ protected: deserializeText(column, istr, settings, true); } + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, true); + } + void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextCSV(IColumn & column, ReadBuffer & istr, 
const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + /// whole = true means that buffer contains only one value, so we should read until EOF. /// It's needed to check if there is garbage after parsed field. virtual void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const = 0; + + virtual bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const + { + try + { + deserializeText(column, istr, settings, whole); + return true; + } + catch (...) + { + return false; + } + } }; } diff --git a/src/DataTypes/Utils.cpp b/src/DataTypes/Utils.cpp index e58331a8bcb..2f29d57d454 100644 --- a/src/DataTypes/Utils.cpp +++ b/src/DataTypes/Utils.cpp @@ -223,6 +223,7 @@ bool canBeSafelyCasted(const DataTypePtr & from_type, const DataTypePtr & to_typ case TypeIndex::AggregateFunction: case TypeIndex::Nothing: case TypeIndex::JSONPaths: + case TypeIndex::Variant: return false; } diff --git a/src/Databases/DatabaseReplicated.cpp b/src/Databases/DatabaseReplicated.cpp index 36dd858dcf7..76f6dc25aae 100644 --- a/src/Databases/DatabaseReplicated.cpp +++ b/src/Databases/DatabaseReplicated.cpp @@ -907,6 +907,7 @@ void DatabaseReplicated::recoverLostReplica(const ZooKeeperPtr & current_zookeep query_context->setSetting("allow_experimental_nlp_functions", 1); query_context->setSetting("allow_experimental_hash_functions", 1); query_context->setSetting("allow_experimental_object_type", 1); + query_context->setSetting("allow_experimental_variant_type", 1); query_context->setSetting("allow_experimental_annoy_index", 1); query_context->setSetting("allow_experimental_usearch_index", 1); query_context->setSetting("allow_experimental_bigint_types", 1); diff --git a/src/Formats/EscapingRuleUtils.cpp b/src/Formats/EscapingRuleUtils.cpp index 9cc7cb3b89e..a2528f9f948 100644 --- a/src/Formats/EscapingRuleUtils.cpp +++ b/src/Formats/EscapingRuleUtils.cpp @@ -109,31 +109,31 @@ bool deserializeFieldByEscapingRule( { case FormatSettings::EscapingRule::Escaped: if (parse_as_nullable) - read = SerializationNullable::deserializeTextEscapedImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(column, buf, format_settings, serialization); else serialization->deserializeTextEscaped(column, buf, format_settings); break; case FormatSettings::EscapingRule::Quoted: if (parse_as_nullable) - read = SerializationNullable::deserializeTextQuotedImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, buf, format_settings, serialization); else serialization->deserializeTextQuoted(column, buf, format_settings); break; case FormatSettings::EscapingRule::CSV: if (parse_as_nullable) - read = SerializationNullable::deserializeTextCSVImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(column, buf, format_settings, serialization); else serialization->deserializeTextCSV(column, buf, format_settings); break; case FormatSettings::EscapingRule::JSON: if (parse_as_nullable) - read = SerializationNullable::deserializeTextJSONImpl(column, buf, format_settings, serialization); + read = 
SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(column, buf, format_settings, serialization); else serialization->deserializeTextJSON(column, buf, format_settings); break; case FormatSettings::EscapingRule::Raw: if (parse_as_nullable) - read = SerializationNullable::deserializeTextRawImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(column, buf, format_settings, serialization); else serialization->deserializeTextRaw(column, buf, format_settings); break; diff --git a/src/Formats/JSONUtils.cpp b/src/Formats/JSONUtils.cpp index 7ddfdb6b572..4e7795f61bd 100644 --- a/src/Formats/JSONUtils.cpp +++ b/src/Formats/JSONUtils.cpp @@ -288,14 +288,14 @@ namespace JSONUtils ReadBufferFromString buf(str); if (as_nullable) - return SerializationNullable::deserializeWholeTextImpl(column, buf, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedWholeText(column, buf, format_settings, serialization); serialization->deserializeWholeText(column, buf, format_settings); return true; } if (as_nullable) - return SerializationNullable::deserializeTextJSONImpl(column, in, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(column, in, format_settings, serialization); serialization->deserializeTextJSON(column, in, format_settings); return true; diff --git a/src/Formats/SchemaInferenceUtils.cpp b/src/Formats/SchemaInferenceUtils.cpp index e2ba188d015..6890e412f75 100644 --- a/src/Formats/SchemaInferenceUtils.cpp +++ b/src/Formats/SchemaInferenceUtils.cpp @@ -946,7 +946,7 @@ namespace if constexpr (is_json) ok = tryReadJSONStringInto(field, buf); else - ok = tryReadQuotedStringInto(field, buf); + ok = tryReadQuotedString(field, buf); if (!ok) return nullptr; diff --git a/src/Functions/FunctionsConversion.h b/src/Functions/FunctionsConversion.h index bef1e7b420a..f9f61ceed0d 100644 --- a/src/Functions/FunctionsConversion.h +++ b/src/Functions/FunctionsConversion.h @@ -28,6 +28,7 @@ #include #include #include +#include #include #include #include @@ -40,6 +41,7 @@ #include #include #include +#include #include #include #include @@ -4067,6 +4069,259 @@ arguments, result_type, input_rows_count); \ "Cast to Object can be performed only from flatten named Tuple, Map or String. Got: {}", from_type->getName()); } + WrapperType createVariantToVariantWrapper(const DataTypeVariant & from_variant, const DataTypeVariant & to_variant) const + { + /// We support only extension of variant type, so, only new types can be added. + /// For example: Variant(T1, T2) -> Variant(T1, T2, T3) is supported, but Variant(T1, T2) -> Variant(T1, T3) is not supported. + /// We want to extend Variant type for free without rewriting the data, but we sort data types inside Variant during type creation + /// (we do it because we want Variant(T1, T2) to be the same as Variant(T2, T1)), but after extension the order of variant types + /// (and so their discriminators) can be different. For example: Variant(T1, T3) -> Variant(T1, T2, T3). + /// To avoid full rewrite of discriminators column, ColumnVariant supports it's local order of variant columns (and so local + /// discriminators) and stores mapping global order -> local order. + /// So, to extend Variant with new types for free, we should keep old local order for old variants, append new variants and change + /// mapping global order -> local order according to the new global order. 
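+ /// For example, when Variant(T1, T3) is extended to Variant(T1, T2, T3), the mapping of old
+ /// global discriminators to new ones is {0 -> 0, 1 -> 2}, and T2 is appended as a new empty
+ /// variant with global discriminator 1, while the local order of the existing columns is kept.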
+ + /// Create map (new variant type) -> (it's global discriminator in new order). + const auto & new_variants = to_variant.getVariants(); + std::unordered_map new_variant_types_to_new_global_discriminator; + new_variant_types_to_new_global_discriminator.reserve(new_variants.size()); + for (size_t i = 0; i != new_variants.size(); ++i) + new_variant_types_to_new_global_discriminator[new_variants[i]->getName()] = i; + + /// Create set of old variant types. + const auto & old_variants = from_variant.getVariants(); + std::unordered_map old_variant_types_to_old_global_discriminator; + old_variant_types_to_old_global_discriminator.reserve(old_variants.size()); + for (size_t i = 0; i != old_variants.size(); ++i) + old_variant_types_to_old_global_discriminator[old_variants[i]->getName()] = i; + + /// Check that the set of old variants types is a subset of new variant types and collect new global discriminator for each old global discriminator. + std::unordered_map old_global_discriminator_to_new; + old_global_discriminator_to_new.reserve(old_variants.size()); + for (const auto & [old_variant_type, old_discriminator] : old_variant_types_to_old_global_discriminator) + { + auto it = new_variant_types_to_new_global_discriminator.find(old_variant_type); + if (it == new_variant_types_to_new_global_discriminator.end()) + throw Exception( + ErrorCodes::CANNOT_CONVERT_TYPE, + "Cannot convert type {} to {}. Conversion between Variant types is allowed only when new Variant type is an extension " + "of an initial one", from_variant.getName(), to_variant.getName()); + old_global_discriminator_to_new[old_discriminator] = it->second; + } + + /// Collect variant types and their global discriminators that should be added to the old Variant to get the new Variant. + std::vector> variant_types_and_discriminators_to_add; + variant_types_and_discriminators_to_add.reserve(new_variants.size() - old_variants.size()); + for (size_t i = 0; i != new_variants.size(); ++i) + { + if (!old_variant_types_to_old_global_discriminator.contains(new_variants[i]->getName())) + variant_types_and_discriminators_to_add.emplace_back(new_variants[i], i); + } + + return [old_global_discriminator_to_new, variant_types_and_discriminators_to_add] + (ColumnsWithTypeAndName & arguments, const DataTypePtr &, const ColumnNullable *, size_t) -> ColumnPtr + { + const auto & column_variant = assert_cast(*arguments.front().column.get()); + size_t num_old_variants = column_variant.getNumVariants(); + Columns new_variant_columns; + new_variant_columns.reserve(num_old_variants + variant_types_and_discriminators_to_add.size()); + std::vector new_local_to_global_discriminators; + new_local_to_global_discriminators.reserve(num_old_variants + variant_types_and_discriminators_to_add.size()); + for (size_t i = 0; i != num_old_variants; ++i) + { + new_variant_columns.push_back(column_variant.getVariantPtrByLocalDiscriminator(i)); + new_local_to_global_discriminators.push_back(old_global_discriminator_to_new.at(column_variant.globalDiscriminatorByLocal(i))); + } + + for (const auto & [new_variant_type, new_global_discriminator] : variant_types_and_discriminators_to_add) + { + new_variant_columns.push_back(new_variant_type->createColumn()); + new_local_to_global_discriminators.push_back(new_global_discriminator); + } + + return ColumnVariant::create(column_variant.getLocalDiscriminatorsPtr(), column_variant.getOffsetsPtr(), new_variant_columns, new_local_to_global_discriminators); + }; + } + + WrapperType createVariantToColumnWrapper(const DataTypeVariant & 
from_variant, const DataTypePtr & to_type) const
+    {
+        const auto & variant_types = from_variant.getVariants();
+        std::vector<WrapperType> variant_wrappers;
+        variant_wrappers.reserve(variant_types.size());
+
+        /// Create conversion wrapper for each variant.
+        for (const auto & variant_type : variant_types)
+            variant_wrappers.push_back(prepareUnpackDictionaries(variant_type, to_type));
+
+        return [variant_wrappers, variant_types, to_type]
+               (ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, const ColumnNullable *, size_t input_rows_count) -> ColumnPtr
+        {
+            const auto & column_variant = assert_cast<const ColumnVariant &>(*arguments.front().column.get());
+
+            /// First, cast each variant to the result type.
+            std::vector<ColumnPtr> casted_variant_columns;
+            casted_variant_columns.reserve(variant_types.size());
+            for (size_t i = 0; i != variant_types.size(); ++i)
+            {
+                auto variant_col = column_variant.getVariantPtrByLocalDiscriminator(i);
+                ColumnsWithTypeAndName variant = {{variant_col, variant_types[i], "" }};
+                const auto & variant_wrapper = variant_wrappers[column_variant.globalDiscriminatorByLocal(i)];
+                casted_variant_columns.push_back(variant_wrapper(variant, result_type, nullptr, variant_col->size()));
+            }
+
+            /// Second, construct resulting column from casted variant columns according to discriminators.
+            const auto & local_discriminators = column_variant.getLocalDiscriminators();
+            auto res = result_type->createColumn();
+            res->reserve(input_rows_count);
+            for (size_t i = 0; i != input_rows_count; ++i)
+            {
+                auto local_discr = local_discriminators[i];
+                if (local_discr == ColumnVariant::NULL_DISCRIMINATOR)
+                    res->insertDefault();
+                else
+                    res->insertFrom(*casted_variant_columns[local_discr], column_variant.offsetAt(i));
+            }
+
+            return res;
+        };
+    }
+
+    static ColumnPtr createVariantFromDescriptorsAndOneNonEmptyVariant(const DataTypes & variant_types, const ColumnPtr & discriminators, const ColumnPtr & variant, ColumnVariant::Discriminator variant_discr)
+    {
+        Columns variants;
+        variants.reserve(variant_types.size());
+        for (size_t i = 0; i != variant_types.size(); ++i)
+        {
+            if (i == variant_discr)
+                variants.emplace_back(variant);
+            else
+                variants.push_back(variant_types[i]->createColumn());
+        }
+
+        return ColumnVariant::create(discriminators, variants);
+    }
+
+    WrapperType createColumnToVariantWrapper(const DataTypePtr & from_type, const DataTypeVariant & to_variant) const
+    {
+        /// We allow converting NULL to Variant(...) as Variant can store NULLs.
+        if (from_type->onlyNull())
+        {
+            return [](ColumnsWithTypeAndName &, const DataTypePtr & result_type, const ColumnNullable *, size_t input_rows_count) -> ColumnPtr
+            {
+                auto result_column = result_type->createColumn();
+                result_column->insertManyDefaults(input_rows_count);
+                return result_column;
+            };
+        }
+
+        auto variant_discr_opt = to_variant.tryGetVariantDiscriminator(removeNullableOrLowCardinalityNullable(from_type));
+        if (!variant_discr_opt)
+            throw Exception(ErrorCodes::CANNOT_CONVERT_TYPE, "Cannot convert type {} to {}. 
Conversion to Variant allowed only for types from this Variant", from_type->getName(), to_variant.getName()); + + return [variant_discr = *variant_discr_opt] + (ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, const ColumnNullable *, size_t) -> ColumnPtr + { + const auto & result_variant_type = assert_cast(*result_type); + const auto & variant_types = result_variant_type.getVariants(); + if (const ColumnNullable * col_nullable = typeid_cast(arguments.front().column.get())) + { + const auto & column = col_nullable->getNestedColumnPtr(); + const auto & null_map = col_nullable->getNullMapData(); + IColumn::Filter filter; + filter.reserve(column->size()); + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + auto & discriminators_data = discriminators->getData(); + discriminators_data.reserve(column->size()); + size_t variant_size_hint = 0; + for (size_t i = 0; i != column->size(); ++i) + { + if (null_map[i]) + { + discriminators_data.push_back(ColumnVariant::NULL_DISCRIMINATOR); + filter.push_back(0); + } + else + { + discriminators_data.push_back(variant_discr); + filter.push_back(1); + ++variant_size_hint; + } + } + + ColumnPtr variant_column; + /// If there were no NULLs, just use the column. + if (variant_size_hint == column->size()) + variant_column = column; + /// Otherwise we should use filtered column. + else + variant_column = column->filter(filter, variant_size_hint); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), variant_column, variant_discr); + } + else if (isColumnLowCardinalityNullable(*arguments.front().column)) + { + const auto & column = arguments.front().column; + + /// Variant column cannot have LowCardinality(Nullable(...)) variant, as Variant column stores NULLs itself. + /// We should create a null-map, insert NULL_DISCRIMINATOR on NULL values and filter initial column. + const auto & col_lc = assert_cast(*column); + const auto & indexes = col_lc.getIndexes(); + auto null_index = col_lc.getDictionary().getNullValueIndex(); + IColumn::Filter filter; + filter.reserve(col_lc.size()); + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + auto & discriminators_data = discriminators->getData(); + discriminators_data.reserve(col_lc.size()); + size_t variant_size_hint = 0; + for (size_t i = 0; i != col_lc.size(); ++i) + { + if (indexes.getUInt(i) == null_index) + { + discriminators_data.push_back(ColumnVariant::NULL_DISCRIMINATOR); + filter.push_back(0); + } + else + { + discriminators_data.push_back(variant_discr); + filter.push_back(1); + ++variant_size_hint; + } + } + + MutableColumnPtr variant_column; + /// If there were no NULLs, we can just clone the column. + if (variant_size_hint == col_lc.size()) + variant_column = IColumn::mutate(column); + /// Otherwise we should filter column. 
+ else + variant_column = column->filter(filter, variant_size_hint)->assumeMutable(); + + assert_cast(*variant_column).nestedRemoveNullable(); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), std::move(variant_column), variant_discr); + } + else + { + const auto & column = arguments.front().column; + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + discriminators->getData().resize_fill(column->size(), variant_discr); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), column, variant_discr); + } + }; + } + + /// Wrapper for conversion to/from Variant type + WrapperType createVariantWrapper(const DataTypePtr & from_type, const DataTypePtr & to_type) const + { + if (const auto * from_variant = checkAndGetDataType(from_type.get())) + { + if (const auto * to_variant = checkAndGetDataType(to_type.get())) + return createVariantToVariantWrapper(*from_variant, *to_variant); + + return createVariantToColumnWrapper(*from_variant, to_type); + } + + return createColumnToVariantWrapper(from_type, assert_cast(*to_type)); + } + template WrapperType createEnumWrapper(const DataTypePtr & from_type, const DataTypeEnum * to_type) const { @@ -4246,6 +4501,11 @@ arguments, result_type, input_rows_count); \ WrapperType prepareUnpackDictionaries(const DataTypePtr & from_type, const DataTypePtr & to_type) const { + /// Conversion from/to Variant data type is processed in a special way. + /// We don't need to remove LowCardinality/Nullable. + if (isVariant(to_type) || isVariant(from_type)) + return createVariantWrapper(from_type, to_type); + const auto * from_low_cardinality = typeid_cast(from_type.get()); const auto * to_low_cardinality = typeid_cast(to_type.get()); const auto & from_nested = from_low_cardinality ? 
from_low_cardinality->getDictionaryType() : from_type; @@ -4253,7 +4513,7 @@ arguments, result_type, input_rows_count); \ if (from_type->onlyNull()) { - if (!to_nested->isNullable()) + if (!to_nested->isNullable() && !isVariant(to_type)) { if (cast_type == CastType::accurateOrNull) { diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index eba1733c683..b15bc5938be 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -4,6 +4,7 @@ #include #include #include +#include #include #include #include @@ -14,6 +15,7 @@ #include #include #include +#include #include #include #include @@ -22,6 +24,8 @@ #include #include #include +#include + #include @@ -215,9 +219,16 @@ class FunctionIf : public FunctionIfBase { public: static constexpr auto name = "if"; - static FunctionPtr create(ContextPtr) { return std::make_shared(); } + static FunctionPtr create(ContextPtr context) + { + return std::make_shared(context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if); + } + + FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} private: + bool use_variant_when_no_common_type = false; + template static UInt32 decimalScale(const ColumnsWithTypeAndName & arguments [[maybe_unused]]) { @@ -626,13 +637,23 @@ private: } static ColumnPtr executeGeneric( - const ColumnUInt8 * cond_col, const ColumnsWithTypeAndName & arguments, size_t input_rows_count) + const ColumnUInt8 * cond_col, const ColumnsWithTypeAndName & arguments, size_t input_rows_count, bool use_variant_when_no_common_type) { /// Convert both columns to the common type (if needed). const ColumnWithTypeAndName & arg1 = arguments[1]; const ColumnWithTypeAndName & arg2 = arguments[2]; - DataTypePtr common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); + DataTypePtr common_type; + if (use_variant_when_no_common_type) + { + common_type = tryGetLeastSupertype(DataTypes{arg1.type, arg2.type}); + if (!common_type) + common_type = std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arg1.type), removeNullableOrLowCardinalityNullable(arg2.type)}); + } + else + { + common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); + } ColumnPtr col_then = castColumn(arg1, common_type); ColumnPtr col_else = castColumn(arg2, common_type); @@ -807,6 +828,10 @@ private: ColumnPtr executeForNullableThenElse(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const { + /// If result type is Variant, we don't need to remove Nullable. 
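+        /// Illustrative example (editor's note, not part of the original patch),
+        /// assuming allow_experimental_variant_type = 1 and
+        /// use_variant_when_no_common_type_in_if = 1:
+        ///     SELECT if(number % 2, number, 'str') FROM numbers(2)
+        /// UInt64 and String have no common type, so the result becomes
+        /// Variant(String, UInt64), which encodes NULLs itself via
+        /// NULL_DISCRIMINATOR instead of a ColumnNullable wrapper.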
+ if (isVariant(result_type)) + return nullptr; + const ColumnWithTypeAndName & arg_cond = arguments[0]; const ColumnWithTypeAndName & arg_then = arguments[1]; const ColumnWithTypeAndName & arg_else = arguments[2]; @@ -912,6 +937,11 @@ private: assert_cast(*result_column).applyNullMap(assert_cast(*arg_cond.column)); return result_column; } + else if (auto * variant_column = typeid_cast(result_column.get())) + { + variant_column->applyNullMap(assert_cast(*arg_cond.column).getData()); + return result_column; + } else return ColumnNullable::create(materializeColumnIfConst(result_column), arg_cond.column); } @@ -950,6 +980,11 @@ private: assert_cast(*result_column).applyNegatedNullMap(assert_cast(*arg_cond.column)); return result_column; } + else if (auto * variant_column = typeid_cast(result_column.get())) + { + variant_column->applyNegatedNullMap(assert_cast(*arg_cond.column).getData()); + return result_column; + } else { size_t size = input_rows_count; @@ -1039,6 +1074,13 @@ public: throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of first argument (condition) of function if. " "Must be UInt8.", arguments[0]->getName()); + if (use_variant_when_no_common_type) + { + if (auto res = tryGetLeastSupertype(DataTypes{arguments[1], arguments[2]})) + return res; + return std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arguments[1]), removeNullableOrLowCardinalityNullable(arguments[2])}); + } + return getLeastSupertype(DataTypes{arguments[1], arguments[2]}); } @@ -1122,7 +1164,7 @@ public: || (res = executeGenericArray(cond_col, arguments, result_type)) || (res = executeTuple(arguments, result_type, input_rows_count)))) { - return executeGeneric(cond_col, arguments, input_rows_count); + return executeGeneric(cond_col, arguments, input_rows_count, use_variant_when_no_common_type); } return res; diff --git a/src/Functions/isNotNull.cpp b/src/Functions/isNotNull.cpp index cbdc08c2fab..360c2fc7f9f 100644 --- a/src/Functions/isNotNull.cpp +++ b/src/Functions/isNotNull.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include @@ -45,6 +46,18 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { const ColumnWithTypeAndName & elem = arguments[0]; + + if (isVariant(elem.type)) + { + const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + auto res = DataTypeUInt8().createColumn(); + auto & data = typeid_cast(*res).getData(); + data.reserve(discriminators.size()); + for (auto discr : discriminators) + data.push_back(discr != ColumnVariant::NULL_DISCRIMINATOR); + return res; + } + if (elem.type->isLowCardinalityNullable()) { const auto * low_cardinality_column = checkAndGetColumn(*elem.column); diff --git a/src/Functions/isNull.cpp b/src/Functions/isNull.cpp index cdce037088d..4bf4e44f866 100644 --- a/src/Functions/isNull.cpp +++ b/src/Functions/isNull.cpp @@ -5,6 +5,7 @@ #include #include #include +#include namespace DB @@ -44,6 +45,18 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t) const override { const ColumnWithTypeAndName & elem = arguments[0]; + + if (isVariant(elem.type)) + { + const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + auto res = DataTypeUInt8().createColumn(); + auto & data = typeid_cast(*res).getData(); + data.reserve(discriminators.size()); + for (auto discr : discriminators) + data.push_back(discr == 
ColumnVariant::NULL_DISCRIMINATOR); + return res; + } + if (elem.type->isLowCardinalityNullable()) { const auto * low_cardinality_column = checkAndGetColumn(*elem.column); diff --git a/src/Functions/multiIf.cpp b/src/Functions/multiIf.cpp index cdb9ca061c3..7a2e9444b2c 100644 --- a/src/Functions/multiIf.cpp +++ b/src/Functions/multiIf.cpp @@ -9,6 +9,7 @@ #include #include #include +#include #include @@ -117,6 +118,15 @@ public: types_of_branches.emplace_back(arg); }); + if (context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if) + { + if (auto res = tryGetLeastSupertype(types_of_branches)) + return res; + for (auto & type : types_of_branches) + type = removeNullableOrLowCardinalityNullable(type); + return std::make_shared(types_of_branches); + } + return getLeastSupertype(types_of_branches); } diff --git a/src/Functions/variantElement.cpp b/src/Functions/variantElement.cpp new file mode 100644 index 00000000000..7c63e1266e6 --- /dev/null +++ b/src/Functions/variantElement.cpp @@ -0,0 +1,238 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int ILLEGAL_TYPE_OF_ARGUMENT; + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; +} + +namespace +{ + +/** Extract element of Variant by variant type name. + * Also the function looks through Arrays: you can get Array of Variant elements from Array of Variants. + */ +class FunctionVariantElement : public IFunction +{ +public: + static constexpr auto name = "variantElement"; + + static FunctionPtr create(ContextPtr) { return std::make_shared(); } + String getName() const override { return name; } + bool isVariadic() const override { return true; } + size_t getNumberOfArguments() const override { return 0; } + bool useDefaultImplementationForConstants() const override { return true; } + ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; } + bool useDefaultImplementationForNulls() const override { return false; } + bool useDefaultImplementationForLowCardinalityColumns() const override { return false; } + bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; } + + DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override + { + const size_t number_of_arguments = arguments.size(); + + if (number_of_arguments < 2 || number_of_arguments > 3) + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "Number of arguments for function {} doesn't match: passed {}, should be 2 or 3", + getName(), number_of_arguments); + + size_t count_arrays = 0; + const IDataType * input_type = arguments[0].type.get(); + while (const DataTypeArray * array = checkAndGetDataType(input_type)) + { + input_type = array->getNestedType().get(); + ++count_arrays; + } + + const DataTypeVariant * variant_type = checkAndGetDataType(input_type); + if (!variant_type) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "First argument for function {} must be Variant or Array of Variant. 
Actual {}",
+                getName(),
+                arguments[0].type->getName());
+
+        std::optional<ColumnVariant::Discriminator> variant_global_discr = getVariantGlobalDiscriminator(arguments[1].column, *variant_type, number_of_arguments);
+        if (variant_global_discr.has_value())
+        {
+            DataTypePtr return_type = makeNullableOrLowCardinalityNullableSafe(variant_type->getVariant(variant_global_discr.value()));
+
+            for (; count_arrays; --count_arrays)
+                return_type = std::make_shared<DataTypeArray>(return_type);
+
+            return return_type;
+        }
+        else
+            return arguments[2].type;
+    }
+
+    ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
+    {
+        const auto & input_arg = arguments[0];
+        const IDataType * input_type = input_arg.type.get();
+        const IColumn * input_col = input_arg.column.get();
+
+        bool input_arg_is_const = false;
+        if (typeid_cast<const ColumnConst *>(input_col))
+        {
+            input_col = assert_cast<const ColumnConst *>(input_col)->getDataColumnPtr().get();
+            input_arg_is_const = true;
+        }
+
+        Columns array_offsets;
+        while (const DataTypeArray * array_type = checkAndGetDataType<DataTypeArray>(input_type))
+        {
+            const ColumnArray * array_col = assert_cast<const ColumnArray *>(input_col);
+
+            input_type = array_type->getNestedType().get();
+            input_col = &array_col->getData();
+            array_offsets.push_back(array_col->getOffsetsPtr());
+        }
+
+        const DataTypeVariant * input_type_as_variant = checkAndGetDataType<DataTypeVariant>(input_type);
+        const ColumnVariant * input_col_as_variant = checkAndGetColumn<ColumnVariant>(input_col);
+        if (!input_type_as_variant || !input_col_as_variant)
+            throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
+                "First argument for function {} must be Variant or Array of Variant. Actual {}", getName(), input_arg.type->getName());
+
+        std::optional<ColumnVariant::Discriminator> variant_global_discr = getVariantGlobalDiscriminator(arguments[1].column, *input_type_as_variant, arguments.size());
+
+        if (!variant_global_discr.has_value())
+            return arguments[2].column;
+
+        const auto & variant_type = input_type_as_variant->getVariant(*variant_global_discr);
+        const auto & variant_column = input_col_as_variant->getVariantPtrByGlobalDiscriminator(*variant_global_discr);
+
+        /// If the Variant has only NULLs or the requested variant doesn't have any real values,
+        /// just create a column with default values and a null mask filled with 1.
+        if (input_col_as_variant->hasOnlyNulls() || variant_column->empty())
+        {
+            auto res = variant_type->createColumn();
+
+            if (variant_type->lowCardinality())
+                assert_cast<ColumnLowCardinality &>(*res).nestedToNullable();
+
+            res->insertManyDefaults(input_col_as_variant->size());
+            if (!variant_type->canBeInsideNullable())
+                return wrapInArraysAndConstIfNeeded(std::move(res), array_offsets, input_arg_is_const, input_rows_count);
+
+            auto null_map = ColumnUInt8::create();
+            auto & null_map_data = null_map->getData();
+            null_map_data.resize_fill(input_col_as_variant->size(), 1);
+            return wrapInArraysAndConstIfNeeded(ColumnNullable::create(std::move(res), std::move(null_map)), array_offsets, input_arg_is_const, input_rows_count);
+        }
+
+        /// If we extract a single non-empty column and have no NULLs, then just return this variant.
+        if (auto non_empty_local_discr = input_col_as_variant->getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls())
+        {
+            /// If we were trying to extract some other variant,
+            /// it would be empty and we would have already processed this case above. 
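+            /// Illustrative walk-through (editor's note, not part of the original
+            /// patch): for Variant(String, UInt64) holding only UInt64 values and
+            /// no NULLs, variantElement(v, 'UInt64') returns the variant column
+            /// as-is (made Nullable), while variantElement(v, 'String') is fully
+            /// handled by the empty-variant branch above.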
+            chassert(input_col_as_variant->globalDiscriminatorByLocal(*non_empty_local_discr) == variant_global_discr);
+            return wrapInArraysAndConstIfNeeded(makeNullableOrLowCardinalityNullableSafe(variant_column), array_offsets, input_arg_is_const, input_rows_count);
+        }
+
+        /// In the general case we should calculate a null-mask for the requested variant
+        /// according to the discriminators column and expand
+        /// the variant column by this mask to get a full column (with default values on NULLs).
+        const auto & local_discriminators = input_col_as_variant->getLocalDiscriminators();
+        auto null_map = ColumnUInt8::create();
+        auto & null_map_data = null_map->getData();
+        null_map_data.reserve(local_discriminators.size());
+        auto variant_local_discr = input_col_as_variant->localDiscriminatorByGlobal(*variant_global_discr);
+        for (auto local_discr : local_discriminators)
+            null_map_data.push_back(local_discr != variant_local_discr);
+
+        auto expanded_variant_column = IColumn::mutate(variant_column);
+        if (variant_type->lowCardinality())
+            expanded_variant_column = assert_cast<ColumnLowCardinality &>(*expanded_variant_column).cloneNullable();
+        expanded_variant_column->expand(null_map_data, /*inverted = */ true);
+        if (variant_type->canBeInsideNullable())
+            return wrapInArraysAndConstIfNeeded(ColumnNullable::create(std::move(expanded_variant_column), std::move(null_map)), array_offsets, input_arg_is_const, input_rows_count);
+        return wrapInArraysAndConstIfNeeded(std::move(expanded_variant_column), array_offsets, input_arg_is_const, input_rows_count);
+    }
+private:
+    std::optional<ColumnVariant::Discriminator> getVariantGlobalDiscriminator(const ColumnPtr & index_column, const DataTypeVariant & variant_type, size_t argument_size) const
+    {
+        const auto * name_col = checkAndGetColumnConst<ColumnString>(index_column.get());
+        if (!name_col)
+            throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
+                "Second argument to {} with Variant argument must be a constant String",
+                getName());
+
+        String variant_element_name = name_col->getValue<String>();
+        auto variant_element_type = DataTypeFactory::instance().tryGet(variant_element_name);
+        if (variant_element_type)
+        {
+            const auto & variants = variant_type.getVariants();
+            for (size_t i = 0; i != variants.size(); ++i)
+            {
+                if (variants[i]->getName() == variant_element_type->getName())
+                    return i;
+            }
+        }
+
+        if (argument_size == 2)
+            throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "{} doesn't contain a variant with type {}", variant_type.getName(), variant_element_name);
+        return std::nullopt;
+    }
+
+    ColumnPtr wrapInArraysAndConstIfNeeded(ColumnPtr res, const Columns & array_offsets, bool input_arg_is_const, size_t input_rows_count) const
+    {
+        for (auto it = array_offsets.rbegin(); it != array_offsets.rend(); ++it)
+            res = ColumnArray::create(res, *it);
+
+        if (input_arg_is_const)
+            res = ColumnConst::create(res, input_rows_count);
+
+        return res;
+    }
+};
+
+}
+
+REGISTER_FUNCTION(VariantElement)
+{
+    factory.registerFunction<FunctionVariantElement>(FunctionDocumentation{
+        .description = R"(
+Extracts a column with specified type from a `Variant` column.
+)",
+        .syntax{"variantElement(variant, type_name[, default_value])"},
+        .arguments{{
+            {"variant", "Variant column"},
+            {"type_name", "The name of the variant type to extract"},
+            {"default_value", "The default value that will be used if the variant doesn't contain a variant with the specified type. Can be any type. 
Optional"}}}, + .examples{{{ + "Example", + R"( +CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory; +INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]); +SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test;)", + R"( +┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐ +│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │ +│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │ +│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ [] │ +│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │ +└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘ +)"}}}, + .categories{"Variant"}, + }); +} + +} diff --git a/src/IO/ReadHelpers.cpp b/src/IO/ReadHelpers.cpp index ff5743a63af..2534f248d83 100644 --- a/src/IO/ReadHelpers.cpp +++ b/src/IO/ReadHelpers.cpp @@ -619,13 +619,16 @@ void readQuotedStringInto(Vector & s, ReadBuffer & buf) readAnyQuotedStringInto<'\'', enable_sql_style_quoting>(s, buf); } -template +template bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf) { - return readAnyQuotedStringInto<'\'', false, Vector, bool>(s, buf); + return readAnyQuotedStringInto<'\'', enable_sql_style_quoting, Vector, bool>(s, buf); } -template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto>(PaddedPODArray & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto>(PaddedPODArray & s, ReadBuffer & buf); template void readDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) @@ -633,6 +636,16 @@ void readDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) readAnyQuotedStringInto<'"', enable_sql_style_quoting>(s, buf); } +template +bool tryReadDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) +{ + return readAnyQuotedStringInto<'"', enable_sql_style_quoting, Vector, bool>(s, buf); +} + +template bool tryReadDoubleQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadDoubleQuotedStringInto(String & s, ReadBuffer & buf); + + template void readBackQuotedStringInto(Vector & s, ReadBuffer & buf) { @@ -652,6 +665,18 @@ void readQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) readQuotedStringInto(s, buf); } +bool tryReadQuotedString(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadQuotedStringInto(s, buf); +} + +bool tryReadQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadQuotedStringInto(s, buf); +} + template void readQuotedStringInto(PaddedPODArray & s, ReadBuffer & buf); template void readQuotedStringInto(String & s, ReadBuffer & buf); @@ -672,6 +697,18 @@ void readDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) readDoubleQuotedStringInto(s, buf); } +bool tryReadDoubleQuotedString(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadDoubleQuotedStringInto(s, buf); +} + +bool tryReadDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadDoubleQuotedStringInto(s, buf); +} + void readBackQuotedString(String & s, ReadBuffer & buf) { s.clear(); @@ -691,7 +728,7 @@ concept WithResize = requires (T value) { value.size() } -> std::integral<>; }; -template +template void readCSVStringInto(Vector & s, ReadBuffer & buf, const FormatSettings::CSV & settings) { /// Empty string @@ -754,12 +791,20 @@ void readCSVStringInto(Vector & s, ReadBuffer & buf, 
const FormatSettings::CSV & { PeekableReadBuffer * peekable_buf = dynamic_cast(&buf); if (!peekable_buf) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Reading CSV string with custom delimiter is allowed only when using PeekableReadBuffer"); + { + if constexpr (allow_throw) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Reading CSV string with custom delimiter is allowed only when using PeekableReadBuffer"); + return; + } while (true) { if (peekable_buf->eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF while reading CSV string, expected custom delimiter \"{}\"", custom_delimiter); + { + if constexpr (allow_throw) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF while reading CSV string, expected custom delimiter \"{}\"", custom_delimiter); + return; + } char * next_pos = reinterpret_cast(memchr(peekable_buf->position(), custom_delimiter[0], peekable_buf->available())); if (!next_pos) @@ -948,6 +993,9 @@ String readCSVFieldWithTwoPossibleDelimiters(PeekableReadBuffer & buf, const For template void readCSVStringInto>(PaddedPODArray & s, ReadBuffer & buf, const FormatSettings::CSV & settings); template void readCSVStringInto(NullOutput & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto(String & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto(String & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto, false, false>(PaddedPODArray & s, ReadBuffer & buf, const FormatSettings::CSV & settings); template @@ -1069,15 +1117,18 @@ ReturnType readJSONObjectPossiblyInvalid(Vector & s, ReadBuffer & buf) } template void readJSONObjectPossiblyInvalid(String & s, ReadBuffer & buf); +template bool readJSONObjectPossiblyInvalid(String & s, ReadBuffer & buf); template void readJSONObjectPossiblyInvalid>(PaddedPODArray & s, ReadBuffer & buf); +template bool readJSONObjectPossiblyInvalid, bool>(PaddedPODArray & s, ReadBuffer & buf); -template -void readJSONArrayInto(Vector & s, ReadBuffer & buf) +template +ReturnType readJSONArrayInto(Vector & s, ReadBuffer & buf) { - readJSONObjectOrArrayPossiblyInvalid(s, buf); + return readJSONObjectOrArrayPossiblyInvalid(s, buf); } -template void readJSONArrayInto>(PaddedPODArray & s, ReadBuffer & buf); +template void readJSONArrayInto, void>(PaddedPODArray & s, ReadBuffer & buf); +template bool readJSONArrayInto, bool>(PaddedPODArray & s, ReadBuffer & buf); template ReturnType readDateTextFallback(LocalDate & date, ReadBuffer & buf) @@ -1217,6 +1268,13 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D return false; } + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[2]) || !isNumericASCII(s[3]) + || !isNumericASCII(s[5]) || !isNumericASCII(s[6]) || !isNumericASCII(s[8]) || !isNumericASCII(s[9])) + return false; + } + UInt16 year = (s[0] - '0') * 1000 + (s[1] - '0') * 100 + (s[2] - '0') * 10 + (s[3] - '0'); UInt8 month = (s[5] - '0') * 10 + (s[6] - '0'); UInt8 day = (s[8] - '0') * 10 + (s[9] - '0'); @@ -1240,6 +1298,13 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D return false; } + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[3]) || !isNumericASCII(s[4]) + || !isNumericASCII(s[6]) || !isNumericASCII(s[7])) + return false; + } + hour = (s[0] - '0') * 10 + (s[1] - '0'); minute = (s[3] - '0') * 10 + (s[4] - '0'); second = 
(s[6] - '0') * 10 + (s[7] - '0'); @@ -1259,7 +1324,14 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D { /// Not very efficient. for (const char * digit_pos = s; digit_pos < s_pos; ++digit_pos) + { + if constexpr (!throw_exception) + { + if (!isNumericASCII(*digit_pos)) + return false; + } datetime = datetime * 10 + *digit_pos - '0'; + } } datetime *= negative_multiplier; @@ -1282,14 +1354,24 @@ template bool readDateTimeTextFallback(time_t &, ReadBuffer &, cons template bool readDateTimeTextFallback(time_t &, ReadBuffer &, const DateLUTImpl &); -void skipJSONField(ReadBuffer & buf, StringRef name_of_field) +template +ReturnType skipJSONFieldImpl(ReadBuffer & buf, StringRef name_of_field) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + return ReturnType(false); + } else if (*buf.position() == '"') /// skip double-quoted string { NullOutput sink; - readJSONStringInto(sink, buf); + if constexpr (throw_exception) + readJSONStringInto(sink, buf); + else if (!tryReadJSONStringInto(sink, buf)) + return ReturnType(false); } else if (isNumericASCII(*buf.position()) || *buf.position() == '-' || *buf.position() == '+' || *buf.position() == '.') /// skip number { @@ -1298,19 +1380,32 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) double v; if (!tryReadFloatText(v, buf)) - throw Exception(ErrorCodes::INCORRECT_DATA, "Expected a number field for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Expected a number field for key '{}'", name_of_field.toString()); + return ReturnType(false); + } } else if (*buf.position() == 'n') /// skip null { - assertString("null", buf); + if constexpr (throw_exception) + assertString("null", buf); + else if (!checkString("null", buf)) + return ReturnType(false); } else if (*buf.position() == 't') /// skip true { - assertString("true", buf); + if constexpr (throw_exception) + assertString("true", buf); + else if (!checkString("true", buf)) + return ReturnType(false); } else if (*buf.position() == 'f') /// skip false { - assertString("false", buf); + if constexpr (throw_exception) + assertString("false", buf); + else if (!checkString("false", buf)) + return ReturnType(false); } else if (*buf.position() == '[') { @@ -1320,12 +1415,16 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) if (!buf.eof() && *buf.position() == ']') /// skip empty array { ++buf.position(); - return; + return ReturnType(true); } while (true) { - skipJSONField(buf, name_of_field); + if constexpr (throw_exception) + skipJSONFieldImpl(buf, name_of_field); + else if (!skipJSONFieldImpl(buf, name_of_field)) + return ReturnType(false); + skipWhitespaceIfAny(buf); if (!buf.eof() && *buf.position() == ',') @@ -1339,7 +1438,11 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) break; } else - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } } } else if (*buf.position() == '{') /// skip whole object @@ -1353,19 +1456,34 @@ void skipJSONField(ReadBuffer & buf, 
StringRef name_of_field) if (*buf.position() == '"') { NullOutput sink; - readJSONStringInto(sink, buf); + if constexpr (throw_exception) + readJSONStringInto(sink, buf); + else if (!tryReadJSONStringInto(sink, buf)) + return ReturnType(false); } else - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } // ':' skipWhitespaceIfAny(buf); if (buf.eof() || !(*buf.position() == ':')) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } ++buf.position(); skipWhitespaceIfAny(buf); - skipJSONField(buf, name_of_field); + if constexpr (throw_exception) + skipJSONFieldImpl(buf, name_of_field); + else if (!skipJSONFieldImpl(buf, name_of_field)) + return ReturnType(false); + skipWhitespaceIfAny(buf); // optional ',' @@ -1377,14 +1495,32 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) } if (buf.eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + return ReturnType(false); + } ++buf.position(); } else { - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol '{}' for key '{}'", - std::string(*buf.position(), 1), name_of_field.toString()); + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol '{}' for key '{}'", + std::string(*buf.position(), 1), name_of_field.toString()); + return ReturnType(false); } + + return ReturnType(true); +} + +void skipJSONField(ReadBuffer & buf, StringRef name_of_field) +{ + skipJSONFieldImpl(buf, name_of_field); +} + +bool trySkipJSONField(ReadBuffer & buf, StringRef name_of_field) +{ + return skipJSONFieldImpl(buf, name_of_field); } @@ -1597,23 +1733,31 @@ void skipToNextRowOrEof(PeekableReadBuffer & buf, const String & row_after_delim } // Use PeekableReadBuffer to copy field to string after parsing. 
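Editor's note: skipJSONFieldImpl above is the template for every try-variant added in this patch: one body, instantiated with ReturnType = void (throwing) or bool (non-throwing), with `if constexpr` choosing between assert-style and check-style calls. A minimal standalone sketch of the idiom; the function and names below are illustrative, not from the patch:

    #include <stdexcept>
    #include <type_traits>

    template <typename ReturnType = void>
    ReturnType parseDigit(char c, int & out)
    {
        static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;
        if (c < '0' || c > '9')
        {
            if constexpr (throw_exception)
                throw std::runtime_error("not a digit");
            return ReturnType(false); /// functional cast: no-op for void, false for bool
        }
        out = c - '0';
        return ReturnType(true);
    }

    /// parseDigit('x', d) throws; parseDigit<bool>('x', d) returns false.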
-template -static void readParsedValueInto(Vector & s, ReadBuffer & buf, ParseFunc parse_func) +template +static ReturnType readParsedValueInto(Vector & s, ReadBuffer & buf, ParseFunc parse_func) { PeekableReadBuffer peekable_buf(buf); peekable_buf.setCheckpoint(); - parse_func(peekable_buf); + if constexpr (std::is_same_v) + parse_func(peekable_buf); + else if (!parse_func(peekable_buf)) + return ReturnType(false); peekable_buf.makeContinuousMemoryFromCheckpointToPos(); auto * end = peekable_buf.position(); peekable_buf.rollbackToCheckpoint(); s.append(peekable_buf.position(), end); peekable_buf.position() = end; + return ReturnType(true); } -template -static void readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) +template +static ReturnType readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) { - assertChar('\'', buf); + if constexpr (std::is_same_v) + assertChar('\'', buf); + else if (!checkChar('\'', buf)) + return ReturnType(false); + s.push_back('\''); while (!buf.eof()) { @@ -1641,16 +1785,23 @@ static void readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) } if (buf.eof()) - return; + return ReturnType(false); ++buf.position(); s.push_back('\''); + return ReturnType(true); } -template -static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) +template +static ReturnType readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) { - assertChar(opening_bracket, buf); + static constexpr bool throw_exception = std::is_same_v; + + if constexpr (throw_exception) + assertChar(opening_bracket, buf); + else if (!checkChar(opening_bracket, buf)) + return ReturnType(false); + s.push_back(opening_bracket); size_t balance = 1; @@ -1666,7 +1817,10 @@ static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) if (*buf.position() == '\'') { - readQuotedStringFieldInto(s, buf); + if constexpr (throw_exception) + readQuotedStringFieldInto(s, buf); + else if (!readQuotedStringFieldInto(s, buf)) + return ReturnType(false); } else if (*buf.position() == opening_bracket) { @@ -1681,13 +1835,20 @@ static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) ++buf.position(); } } + + if (balance) + return ReturnType(false); + + return ReturnType(true); } -template -void readQuotedFieldInto(Vector & s, ReadBuffer & buf) +template +ReturnType readQuotedFieldInto(Vector & s, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) - return; + return ReturnType(false); /// Possible values in 'Quoted' field: /// - Strings: '...' @@ -1699,35 +1860,47 @@ void readQuotedFieldInto(Vector & s, ReadBuffer & buf) /// - Number: integer, float, decimal. 
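+    /// Illustrative inputs and results (editor's note, not part of the original
+    /// patch):
+    ///     'abc'          -> "'abc'" (quotes preserved)
+    ///     [1, 'x', NULL] -> copied verbatim once brackets are balanced
+    ///     nan / null     -> normalized to "NaN" / "NULL"
+    ///     -12.5e3        -> validated as a float, then copied as-is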
if (*buf.position() == '\'') - readQuotedStringFieldInto(s, buf); + return readQuotedStringFieldInto(s, buf); else if (*buf.position() == '[') - readQuotedFieldInBracketsInto<'[', ']'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (*buf.position() == '(') - readQuotedFieldInBracketsInto<'(', ')'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (*buf.position() == '{') - readQuotedFieldInBracketsInto<'{', '}'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (checkCharCaseInsensitive('n', buf)) { /// NULL or NaN if (checkCharCaseInsensitive('u', buf)) { - assertStringCaseInsensitive("ll", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("ll", buf); + else if (!checkStringCaseInsensitive("ll", buf)) + return ReturnType(false); s.append("NULL"); } else { - assertStringCaseInsensitive("an", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("an", buf); + else if (!checkStringCaseInsensitive("an", buf)) + return ReturnType(false); s.append("NaN"); } } else if (checkCharCaseInsensitive('t', buf)) { - assertStringCaseInsensitive("rue", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("rue", buf); + else if (!checkStringCaseInsensitive("rue", buf)) + return ReturnType(false); s.append("true"); } else if (checkCharCaseInsensitive('f', buf)) { - assertStringCaseInsensitive("alse", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("alse", buf); + else if (!checkStringCaseInsensitive("alse", buf)) + return ReturnType(false); s.append("false"); } else @@ -1736,13 +1909,19 @@ void readQuotedFieldInto(Vector & s, ReadBuffer & buf) auto parse_func = [](ReadBuffer & in) { Float64 tmp; - readFloatText(tmp, in); + if constexpr (throw_exception) + readFloatText(tmp, in); + else + return tryReadFloatText(tmp, in); }; - readParsedValueInto(s, buf, parse_func); + + return readParsedValueInto(s, buf, parse_func); } + + return ReturnType(true); } -template void readQuotedFieldInto(NullOutput & s, ReadBuffer & buf); +template void readQuotedFieldInto(NullOutput & s, ReadBuffer & buf); void readQuotedField(String & s, ReadBuffer & buf) { @@ -1750,11 +1929,24 @@ void readQuotedField(String & s, ReadBuffer & buf) readQuotedFieldInto(s, buf); } +bool tryReadQuotedField(String & s, ReadBuffer & buf) +{ + s.clear(); + return readQuotedFieldInto(s, buf); +} + void readJSONField(String & s, ReadBuffer & buf) { s.clear(); auto parse_func = [](ReadBuffer & in) { skipJSONField(in, "json_field"); }; - readParsedValueInto(s, buf, parse_func); + readParsedValueInto(s, buf, parse_func); +} + +bool tryReadJSONField(String & s, ReadBuffer & buf) +{ + s.clear(); + auto parse_func = [](ReadBuffer & in) { return trySkipJSONField(in, "json_field"); }; + return readParsedValueInto(s, buf, parse_func); } void readTSVField(String & s, ReadBuffer & buf) diff --git a/src/IO/ReadHelpers.h b/src/IO/ReadHelpers.h index 17f3d3d4151..ad62a3deaca 100644 --- a/src/IO/ReadHelpers.h +++ b/src/IO/ReadHelpers.h @@ -257,26 +257,43 @@ inline void readBoolText(bool & x, ReadBuffer & buf) x = tmp != '0'; } -inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case = false) +template +inline ReturnType readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case = false) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + else + return ReturnType(false); + } switch 
(*buf.position()) { case 't': - assertString("true", buf); + if constexpr (throw_exception) + assertString("true", buf); + else if (!checkString("true", buf)) + return ReturnType(false); x = true; break; case 'f': - assertString("false", buf); + if constexpr (throw_exception) + assertString("false", buf); + else if (!checkString("false", buf)) + return ReturnType(false); x = false; break; case 'T': { if (support_upper_case) { - assertString("TRUE", buf); + if constexpr (throw_exception) + assertString("TRUE", buf); + else if (!checkString("TRUE", buf)) + return ReturnType(false); x = true; break; } @@ -287,7 +304,10 @@ inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case { if (support_upper_case) { - assertString("FALSE", buf); + if constexpr (throw_exception) + assertString("FALSE", buf); + else if (!checkString("FALSE", buf)) + return ReturnType(false); x = false; break; } @@ -295,8 +315,15 @@ inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case [[fallthrough]]; } default: - throw ParsingException(ErrorCodes::CANNOT_PARSE_BOOL, "Unexpected Bool value"); + { + if constexpr (throw_exception) + throw ParsingException(ErrorCodes::CANNOT_PARSE_BOOL, "Unexpected Bool value"); + else + return ReturnType(false); + } } + + return ReturnType(true); } enum class ReadIntTextCheckOverflow @@ -468,7 +495,10 @@ void readIntText(T & x, ReadBuffer & buf) template bool tryReadIntText(T & x, ReadBuffer & buf) { - return readIntTextImpl(x, buf); + if constexpr (is_decimal) + return tryReadIntText(x.value, buf); + else + return readIntTextImpl(x, buf); } @@ -477,16 +507,18 @@ bool tryReadIntText(T & x, ReadBuffer & buf) * - for numbers starting with zero, parsed only zero; * - symbol '+' before number is not supported; */ -template -void readIntTextUnsafe(T & x, ReadBuffer & buf) +template +ReturnType readIntTextUnsafe(T & x, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; bool negative = false; make_unsigned_t res = 0; auto on_error = [] { - if (throw_on_error) + if constexpr (throw_exception) throwReadAfterEOF(); + return ReturnType(false); }; if (buf.eof()) [[unlikely]] @@ -504,7 +536,7 @@ void readIntTextUnsafe(T & x, ReadBuffer & buf) { ++buf.position(); x = 0; - return; + return ReturnType(true); } while (!buf.eof()) @@ -523,12 +555,13 @@ void readIntTextUnsafe(T & x, ReadBuffer & buf) /// See note about undefined behaviour above. x = is_signed_v && negative ? 
-res : res; + return ReturnType(true); } template -void tryReadIntTextUnsafe(T & x, ReadBuffer & buf) +bool tryReadIntTextUnsafe(T & x, ReadBuffer & buf) { - return readIntTextUnsafe(x, buf); + return readIntTextUnsafe(x, buf); } @@ -550,9 +583,15 @@ void readEscapedString(String & s, ReadBuffer & buf); void readQuotedString(String & s, ReadBuffer & buf); void readQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); +bool tryReadQuotedString(String & s, ReadBuffer & buf); +bool tryReadQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); + void readDoubleQuotedString(String & s, ReadBuffer & buf); void readDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); +bool tryReadDoubleQuotedString(String & s, ReadBuffer & buf); +bool tryReadDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); + void readJSONString(String & s, ReadBuffer & buf); void readBackQuotedString(String & s, ReadBuffer & buf); @@ -615,7 +654,7 @@ void readBackQuotedStringInto(Vector & s, ReadBuffer & buf); template void readStringUntilEOFInto(Vector & s, ReadBuffer & buf); -template +template void readCSVStringInto(Vector & s, ReadBuffer & buf, const FormatSettings::CSV & settings); /// ReturnType is either bool or void. If bool, the function will return false instead of throwing an exception. @@ -628,7 +667,7 @@ bool tryReadJSONStringInto(Vector & s, ReadBuffer & buf) return readJSONStringInto(s, buf); } -template +template bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf); /// Reads chunk of data between {} in that way, @@ -637,8 +676,8 @@ bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf); template ReturnType readJSONObjectPossiblyInvalid(Vector & s, ReadBuffer & buf); -template -void readJSONArrayInto(Vector & s, ReadBuffer & buf); +template +ReturnType readJSONArrayInto(Vector & s, ReadBuffer & buf); template void readStringUntilWhitespaceInto(Vector & s, ReadBuffer & buf); @@ -962,6 +1001,13 @@ inline ReturnType readDateTimeTextImpl(time_t & datetime, ReadBuffer & buf, cons { if (s[4] < '0' || s[4] > '9') { + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[2]) || !isNumericASCII(s[3]) + || !isNumericASCII(s[5]) || !isNumericASCII(s[6]) || !isNumericASCII(s[8]) || !isNumericASCII(s[9])) + return ReturnType(false); + } + UInt16 year = (s[0] - '0') * 1000 + (s[1] - '0') * 100 + (s[2] - '0') * 10 + (s[3] - '0'); UInt8 month = (s[5] - '0') * 10 + (s[6] - '0'); UInt8 day = (s[8] - '0') * 10 + (s[9] - '0'); @@ -974,6 +1020,13 @@ inline ReturnType readDateTimeTextImpl(time_t & datetime, ReadBuffer & buf, cons bool dt_long = (s[10] == ' ' || s[10] == 'T'); if (dt_long) { + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[11]) || !isNumericASCII(s[12]) || !isNumericASCII(s[14]) || !isNumericASCII(s[15]) + || !isNumericASCII(s[17]) || !isNumericASCII(s[18])) + return ReturnType(false); + } + hour = (s[11] - '0') * 10 + (s[12] - '0'); minute = (s[14] - '0') * 10 + (s[15] - '0'); second = (s[17] - '0') * 10 + (s[18] - '0'); @@ -1311,6 +1364,11 @@ inline bool tryReadText(is_integer auto & x, ReadBuffer & buf) return tryReadIntText(x, buf); } +inline bool tryReadText(is_floating_point auto & x, ReadBuffer & buf) +{ + return tryReadFloatText(x, buf); +} + inline bool tryReadText(UUID & x, ReadBuffer & buf) { return tryReadUUIDText(x, buf); } inline bool tryReadText(IPv4 & x, ReadBuffer & buf) { return tryReadIPv4Text(x, buf); } inline bool tryReadText(IPv6 & x, ReadBuffer & buf) { return tryReadIPv6Text(x, buf); } @@ 
-1320,9 +1378,20 @@ inline void readText(is_floating_point auto & x, ReadBuffer & buf) { readFloatTe inline void readText(String & x, ReadBuffer & buf) { readEscapedString(x, buf); } inline void readText(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone = DateLUT::instance()) { readDateText(x, buf, time_zone); } +inline bool tryReadText(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone = DateLUT::instance()) { return tryReadDateText(x, buf, time_zone); } inline void readText(LocalDate & x, ReadBuffer & buf) { readDateText(x, buf); } +inline bool tryReadText(LocalDate & x, ReadBuffer & buf) { return tryReadDateText(x, buf); } inline void readText(LocalDateTime & x, ReadBuffer & buf) { readDateTimeText(x, buf); } +inline bool tryReadText(LocalDateTime & x, ReadBuffer & buf) +{ + time_t time; + if (!tryReadDateTimeText(time, buf)) + return false; + x = LocalDateTime(time, DateLUT::instance()); + return true; +} + inline void readText(UUID & x, ReadBuffer & buf) { readUUIDText(x, buf); } inline void readText(IPv4 & x, ReadBuffer & buf) { readIPv4Text(x, buf); } inline void readText(IPv6 & x, ReadBuffer & buf) { readIPv6Text(x, buf); } @@ -1400,39 +1469,71 @@ inline void readDoubleQuoted(LocalDateTime & x, ReadBuffer & buf) } /// CSV for numbers: quotes are optional, no special escaping rules. -template -inline void readCSVSimple(T & x, ReadBuffer & buf) +template +inline ReturnType readCSVSimple(T & x, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + return ReturnType(false); + } char maybe_quote = *buf.position(); if (maybe_quote == '\'' || maybe_quote == '\"') ++buf.position(); - readText(x, buf); + if constexpr (throw_exception) + readText(x, buf); + else if (!tryReadText(x, buf)) + return ReturnType(false); if (maybe_quote == '\'' || maybe_quote == '\"') - assertChar(maybe_quote, buf); + { + if constexpr (throw_exception) + assertChar(maybe_quote, buf); + else if (!checkChar(maybe_quote, buf)) + return ReturnType(false); + } + + return ReturnType(true); } // standalone overload for dates: to avoid instantiating DateLUTs while parsing other types -template -inline void readCSVSimple(T & x, ReadBuffer & buf, const DateLUTImpl & time_zone) +template +inline ReturnType readCSVSimple(T & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + return ReturnType(false); + } char maybe_quote = *buf.position(); if (maybe_quote == '\'' || maybe_quote == '\"') ++buf.position(); - readText(x, buf, time_zone); + if constexpr (throw_exception) + readText(x, buf, time_zone); + else if (!tryReadText(x, buf, time_zone)) + return ReturnType(false); if (maybe_quote == '\'' || maybe_quote == '\"') - assertChar(maybe_quote, buf); + { + if constexpr (throw_exception) + assertChar(maybe_quote, buf); + else if (!checkChar(maybe_quote, buf)) + return ReturnType(false); + } + + return ReturnType(true); } template @@ -1442,18 +1543,52 @@ inline void readCSV(T & x, ReadBuffer & buf) readCSVSimple(x, buf); } +template +requires is_arithmetic_v +inline bool tryReadCSV(T & x, ReadBuffer & buf) +{ + return readCSVSimple(x, buf); +} + inline void readCSV(String & x, ReadBuffer & buf, const FormatSettings::CSV & settings) { readCSVString(x, buf, settings); } +inline bool tryReadCSV(String & x, 
ReadBuffer & buf, const FormatSettings::CSV & settings) +{ + x.clear(); + readCSVStringInto(x, buf, settings); + return true; +} + inline void readCSV(LocalDate & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(LocalDate & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(DayNum & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(DayNum & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } inline void readCSV(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { readCSVSimple(x, buf, time_zone); } +inline bool tryReadCSV(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { return readCSVSimple(x, buf, time_zone); } + inline void readCSV(LocalDateTime & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(LocalDateTime & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UUID & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UUID & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(IPv4 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(IPv4 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(IPv6 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(IPv6 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UInt128 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UInt128 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(Int128 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(Int128 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UInt256 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UInt256 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(Int256 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(Int256 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } template void readBinary(std::vector & x, ReadBuffer & buf) @@ -1535,6 +1670,7 @@ inline void skipWhitespaceIfAny(ReadBuffer & buf, bool one_line = false) /// Skips json value. void skipJSONField(ReadBuffer & buf, StringRef name_of_field); +bool trySkipJSONField(ReadBuffer & buf, StringRef name_of_field); /** Read serialized exception. 
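Editor's note: the readCSVSimple overloads above implement the CSV convention that surrounding quotes are optional but, when present, must be closed by the same quote character. A standalone sketch of that convention under the same rules; the function below is illustrative and not part of the patch:

    #include <cctype>
    #include <string>

    /// Accepts 42, '42' and "42"; rejects mismatched or unterminated quotes.
    bool tryParseCSVUInt(const std::string & s, unsigned & out)
    {
        size_t pos = 0;
        if (s.empty())
            return false;
        char maybe_quote = s[pos];
        if (maybe_quote == '\'' || maybe_quote == '"')
            ++pos;
        size_t start = pos;
        unsigned value = 0;
        while (pos < s.size() && std::isdigit(static_cast<unsigned char>(s[pos])))
            value = value * 10 + static_cast<unsigned>(s[pos++] - '0');
        if (pos == start)
            return false; /// no digits after the optional quote
        if (maybe_quote == '\'' || maybe_quote == '"')
        {
            if (pos == s.size() || s[pos] != maybe_quote)
                return false; /// closing quote must match the opening one
            ++pos;
        }
        out = value;
        return pos == s.size();
    }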
@@ -1749,12 +1885,14 @@ struct PcgDeserializer } }; -template -void readQuotedFieldInto(Vector & s, ReadBuffer & buf); +template +ReturnType readQuotedFieldInto(Vector & s, ReadBuffer & buf); void readQuotedField(String & s, ReadBuffer & buf); +bool tryReadQuotedField(String & s, ReadBuffer & buf); void readJSONField(String & s, ReadBuffer & buf); +bool tryReadJSONField(String & s, ReadBuffer & buf); void readTSVField(String & s, ReadBuffer & buf); diff --git a/src/IO/readDecimalText.h b/src/IO/readDecimalText.h index 9fd9c439b87..81bde87f1f1 100644 --- a/src/IO/readDecimalText.h +++ b/src/IO/readDecimalText.h @@ -224,4 +224,24 @@ inline void readCSVDecimalText(ReadBuffer & buf, T & x, uint32_t precision, uint assertChar(maybe_quote, buf); } +template +inline bool tryReadCSVDecimalText(ReadBuffer & buf, T & x, uint32_t precision, uint32_t & scale) +{ + if (buf.eof()) + return false; + + char maybe_quote = *buf.position(); + + if (maybe_quote == '\'' || maybe_quote == '\"') + ++buf.position(); + + if (!tryReadDecimalText(buf, x, precision, scale)) + return false; + + if ((maybe_quote == '\'' || maybe_quote == '\"') && !checkChar(maybe_quote, buf)) + return false; + + return true; +} + } diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index bf07f4ed3ee..51f767afc04 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -939,6 +939,20 @@ void InterpreterCreateQuery::validateTableStructure(const ASTCreateQuery & creat } } } + if (!create.attach && !settings.allow_experimental_variant_type) + { + for (const auto & [name, type] : properties.columns.getAllPhysical()) + { + if (isVariant(type)) + { + throw Exception(ErrorCodes::ILLEGAL_COLUMN, + "Cannot create table with column '{}' which type is '{}' " + "because experimental Variant type is not allowed. " + "Set setting allow_experimental_variant_type = 1 in order to allow it", + name, type->getName()); + } + } + } } namespace diff --git a/src/Interpreters/InterpreterInsertQuery.cpp b/src/Interpreters/InterpreterInsertQuery.cpp index 283289f0dfc..32b24cba940 100644 --- a/src/Interpreters/InterpreterInsertQuery.cpp +++ b/src/Interpreters/InterpreterInsertQuery.cpp @@ -532,7 +532,7 @@ BlockIO InterpreterInsertQuery::execute() { /// Change query sample block columns to Nullable to allow inserting nullable columns, where NULL values will be substituted with /// default column values (in AddingDefaultsTransform), so all values will be cast correctly. 
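+            /// (Editor's note, not part of the original patch: Variant target
+            /// columns are excluded below because Variant represents NULL itself
+            /// via NULL_DISCRIMINATOR, so the query column does not need to be
+            /// wrapped into Nullable first.)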
-                if (isNullableOrLowCardinalityNullable(input_columns[col_idx].type) && !isNullableOrLowCardinalityNullable(query_columns[col_idx].type) && output_columns.has(query_columns[col_idx].name))
+                if (isNullableOrLowCardinalityNullable(input_columns[col_idx].type) && !isNullableOrLowCardinalityNullable(query_columns[col_idx].type) && !isVariant(query_columns[col_idx].type) && output_columns.has(query_columns[col_idx].name))
                     query_sample_block.setColumn(col_idx, ColumnWithTypeAndName(makeNullableOrLowCardinalityNullable(query_columns[col_idx].column), makeNullableOrLowCardinalityNullable(query_columns[col_idx].type), query_columns[col_idx].name));
             }
         }
diff --git a/src/Interpreters/inplaceBlockConversions.cpp b/src/Interpreters/inplaceBlockConversions.cpp
index c7a1cab8bac..fd8f5b154c4 100644
--- a/src/Interpreters/inplaceBlockConversions.cpp
+++ b/src/Interpreters/inplaceBlockConversions.cpp
@@ -237,17 +237,36 @@ static std::unordered_map<String, ColumnPtr> collectOffsetsColumns(
             {
                 auto & offsets_column = offsets_columns[stream_name];
                 if (!offsets_column)
+                {
                     offsets_column = current_offsets_column;
+                }
+                else
+                {
+                    /// If we are inside a Variant element, the offsets may
+                    /// differ: when a Variant element is read as a subcolumn,
+                    /// the column is expanded according to the discriminators,
+                    /// so its offsets column can change. In that case select
+                    /// the original offsets column of this stream, which is
+                    /// the smaller one.
+                    bool inside_variant_element = false;
+                    for (const auto & elem : subpath)
+                        inside_variant_element |= elem.type == ISerialization::Substream::VariantElement;

-    #ifndef NDEBUG
-                const auto & offsets_data = assert_cast<const ColumnUInt64 &>(*offsets_column).getData();
-                const auto & current_offsets_data = assert_cast<const ColumnUInt64 &>(*current_offsets_column).getData();
+                    if (offsets_column->size() != current_offsets_column->size() && inside_variant_element)
+                        offsets_column = offsets_column->size() < current_offsets_column->size() ? offsets_column : current_offsets_column;
+#ifndef NDEBUG
+                    else
+                    {
+                        const auto & offsets_data = assert_cast<const ColumnUInt64 &>(*offsets_column).getData();
+                        const auto & current_offsets_data = assert_cast<const ColumnUInt64 &>(*current_offsets_column).getData();

-                if (offsets_data != current_offsets_data)
-                    throw Exception(ErrorCodes::LOGICAL_ERROR,
-                        "Found non-equal columns with offsets (sizes: {} and {}) for stream {}",
-                        offsets_data.size(), current_offsets_data.size(), stream_name);
-    #endif
+                        if (offsets_data != current_offsets_data)
+                            throw Exception(ErrorCodes::LOGICAL_ERROR,
+                                "Found non-equal columns with offsets (sizes: {} and {}) for stream {}",
+                                offsets_data.size(), current_offsets_data.size(), stream_name);
+                    }
+#endif
+                }
             }
         }, available_column->type, res_columns[i]);
     }
diff --git a/src/Interpreters/parseColumnsListForTableFunction.cpp b/src/Interpreters/parseColumnsListForTableFunction.cpp
index 87f76f7f824..551a883d093 100644
--- a/src/Interpreters/parseColumnsListForTableFunction.cpp
+++ b/src/Interpreters/parseColumnsListForTableFunction.cpp
@@ -60,6 +60,17 @@ void validateDataType(const DataTypePtr & type, const DataTypeValidationSettings
                 MAX_FIXEDSTRING_SIZE_WITHOUT_SUSPICIOUS);
         }
     }
+
+    if (!settings.allow_experimental_variant_type)
+    {
+        if (isVariant(type))
+        {
+            throw Exception(
+                ErrorCodes::ILLEGAL_COLUMN,
+                "Cannot create column with type '{}' because experimental Variant type is not allowed. "
" + "Set setting allow_experimental_variant_type = 1 in order to allow it", type->getName()); + } + } } ColumnsDescription parseColumnsListFromString(const std::string & structure, const ContextPtr & context) diff --git a/src/Interpreters/parseColumnsListForTableFunction.h b/src/Interpreters/parseColumnsListForTableFunction.h index ef1bbe5498e..1fbbfa4b12f 100644 --- a/src/Interpreters/parseColumnsListForTableFunction.h +++ b/src/Interpreters/parseColumnsListForTableFunction.h @@ -18,12 +18,14 @@ struct DataTypeValidationSettings : allow_suspicious_low_cardinality_types(settings.allow_suspicious_low_cardinality_types) , allow_experimental_object_type(settings.allow_experimental_object_type) , allow_suspicious_fixed_string_types(settings.allow_suspicious_fixed_string_types) + , allow_experimental_variant_type(settings.allow_experimental_variant_type) { } bool allow_suspicious_low_cardinality_types = true; bool allow_experimental_object_type = true; bool allow_suspicious_fixed_string_types = true; + bool allow_experimental_variant_type = true; }; void validateDataType(const DataTypePtr & type, const DataTypeValidationSettings & settings); diff --git a/src/Parsers/ExpressionElementParsers.cpp b/src/Parsers/ExpressionElementParsers.cpp index 594221fe050..5dc791f7003 100644 --- a/src/Parsers/ExpressionElementParsers.cpp +++ b/src/Parsers/ExpressionElementParsers.cpp @@ -250,7 +250,7 @@ bool ParserTableAsStringLiteralIdentifier::parseImpl(Pos & pos, ASTPtr & node, E ReadBufferFromMemory in(pos->begin, pos->size()); String s; - if (!tryReadQuotedStringInto(s, in)) + if (!tryReadQuotedString(s, in)) { expected.add(pos, "string literal"); return false; diff --git a/src/Processors/Formats/Impl/CSVRowInputFormat.cpp b/src/Processors/Formats/Impl/CSVRowInputFormat.cpp index 5e12ec18d27..cab0f7523f1 100644 --- a/src/Processors/Formats/Impl/CSVRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/CSVRowInputFormat.cpp @@ -391,7 +391,7 @@ bool CSVFormatReader::readFieldImpl(ReadBuffer & istr, DB::IColumn & column, con if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type)) { /// If value is null but type is not nullable then use default value instead. - return SerializationNullable::deserializeTextCSVImpl(column, istr, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(column, istr, format_settings, serialization); } /// Read the column normally. 
diff --git a/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp b/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp
index 7e8b4accf4d..9c7f095e661 100644
--- a/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp
+++ b/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp
@@ -409,7 +409,7 @@ bool MySQLDumpRowInputFormat::readField(IColumn & column, size_t column_idx)
     const auto & type = types[column_idx];
     const auto & serialization = serializations[column_idx];
     if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type))
-        return SerializationNullable::deserializeTextQuotedImpl(column, *in, format_settings, serialization);
+        return SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, *in, format_settings, serialization);

     serialization->deserializeTextQuoted(column, *in, format_settings);
     return true;
diff --git a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp
index f4f92583473..0f68c28ab1f 100644
--- a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp
+++ b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp
@@ -147,7 +147,7 @@ bool TSKVRowInputFormat::readRow(MutableColumns & columns, RowReadExtension & ex
                 const auto & type = getPort().getHeader().getByPosition(index).type;
                 const auto & serialization = serializations[index];
                 if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type))
-                    read_columns[index] = SerializationNullable::deserializeTextEscapedImpl(*columns[index], *in, format_settings, serialization);
+                    read_columns[index] = SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(*columns[index], *in, format_settings, serialization);
                 else
                     serialization->deserializeTextEscaped(*columns[index], *in, format_settings);
             }
diff --git a/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp b/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp
index 3205adc2a48..88eb11d130d 100644
--- a/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp
+++ b/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp
@@ -167,7 +167,7 @@ bool TabSeparatedFormatReader::readField(IColumn & column, const DataTypePtr & t
     if (is_raw)
     {
         if (as_nullable)
-            return SerializationNullable::deserializeTextRawImpl(column, *buf, format_settings, serialization);
+            return SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(column, *buf, format_settings, serialization);

         serialization->deserializeTextRaw(column, *buf, format_settings);
         return true;
@@ -175,7 +175,7 @@ bool TabSeparatedFormatReader::readField(IColumn & column, const DataTypePtr & t
     if (as_nullable)
-        return SerializationNullable::deserializeTextEscapedImpl(column, *buf, format_settings, serialization);
+        return SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(column, *buf, format_settings, serialization);

     serialization->deserializeTextEscaped(column, *buf, format_settings);
     return true;
diff --git a/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp b/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp
index d55ccce8879..a7b5795b89e 100644
--- a/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp
+++ b/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp
@@ -293,7 +293,7 @@ bool ValuesBlockInputFormat::tryReadValue(IColumn & column, size_t column_idx)
         const auto & type = types[column_idx];
         const auto & serialization = serializations[column_idx];
         if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type))
-            read =
SerializationNullable::deserializeTextQuotedImpl(column, *buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, *buf, format_settings, serialization); else serialization->deserializeTextQuoted(column, *buf, format_settings); } diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.reference b/tests/queries/0_stateless/02940_variant_text_deserialization.reference new file mode 100644 index 00000000000..98725917567 --- /dev/null +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.reference @@ -0,0 +1,516 @@ +JSON +String +{"v":null,"variantElement(v, 'String')":null} +{"v":"string","variantElement(v, 'String')":"string"} +{"v":"42","variantElement(v, 'String')":null} +FixedString +{"v":null,"variantElement(v, 'FixedString(4)')":null} +{"v":"string","variantElement(v, 'FixedString(4)')":null} +{"v":"abcd","variantElement(v, 'FixedString(4)')":"abcd"} +Bool +{"v":null,"variantElement(v, 'Bool')":null} +{"v":"string","variantElement(v, 'Bool')":null} +{"v":true,"variantElement(v, 'Bool')":true} +Integers +{"v":null,"variantElement(v, 'Int8')":null} +{"v":"string","variantElement(v, 'Int8')":null} +{"v":-1,"variantElement(v, 'Int8')":-1} +{"v":0,"variantElement(v, 'Int8')":0} +{"v":"10000000000","variantElement(v, 'Int8')":null} +{"v":null,"variantElement(v, 'UInt8')":null} +{"v":"string","variantElement(v, 'UInt8')":null} +{"v":"-1","variantElement(v, 'UInt8')":null} +{"v":0,"variantElement(v, 'UInt8')":0} +{"v":"10000000000","variantElement(v, 'UInt8')":null} +{"v":null,"variantElement(v, 'Int16')":null} +{"v":"string","variantElement(v, 'Int16')":null} +{"v":-1,"variantElement(v, 'Int16')":-1} +{"v":0,"variantElement(v, 'Int16')":0} +{"v":"10000000000","variantElement(v, 'Int16')":null} +{"v":null,"variantElement(v, 'UInt16')":null} +{"v":"string","variantElement(v, 'UInt16')":null} +{"v":"-1","variantElement(v, 'UInt16')":null} +{"v":0,"variantElement(v, 'UInt16')":0} +{"v":"10000000000","variantElement(v, 'UInt16')":null} +{"v":null,"variantElement(v, 'Int32')":null} +{"v":"string","variantElement(v, 'Int32')":null} +{"v":-1,"variantElement(v, 'Int32')":-1} +{"v":0,"variantElement(v, 'Int32')":0} +{"v":"10000000000","variantElement(v, 'Int32')":null} +{"v":null,"variantElement(v, 'UInt32')":null} +{"v":"string","variantElement(v, 'UInt32')":null} +{"v":"-1","variantElement(v, 'UInt32')":null} +{"v":0,"variantElement(v, 'UInt32')":0} +{"v":"10000000000","variantElement(v, 'UInt32')":null} +{"v":null,"variantElement(v, 'Int64')":null} +{"v":"string","variantElement(v, 'Int64')":null} +{"v":"-1","variantElement(v, 'Int64')":"-1"} +{"v":"0","variantElement(v, 'Int64')":"0"} +{"v":"10000000000000000000000","variantElement(v, 'Int64')":null} +{"v":null,"variantElement(v, 'UInt64')":null} +{"v":"string","variantElement(v, 'UInt64')":null} +{"v":"-1","variantElement(v, 'UInt64')":null} +{"v":"0","variantElement(v, 'UInt64')":"0"} +{"v":"10000000000000000000000","variantElement(v, 'UInt64')":null} +{"v":null,"variantElement(v, 'Int128')":null} +{"v":"string","variantElement(v, 'Int128')":null} +{"v":"-1","variantElement(v, 'Int128')":"-1"} +{"v":"0","variantElement(v, 'Int128')":"0"} +{"v":null,"variantElement(v, 'UInt128')":null} +{"v":"string","variantElement(v, 'UInt128')":null} +{"v":"-1","variantElement(v, 'UInt128')":null} +{"v":"0","variantElement(v, 'UInt128')":"0"} +Floats +{"v":null,"variantElement(v, 'Float32')":null} +{"v":"string","variantElement(v, 'Float32')":null} 
+{"v":42.42,"variantElement(v, 'Float32')":42.42} +{"v":null,"variantElement(v, 'Float64')":null} +{"v":"string","variantElement(v, 'Float64')":null} +{"v":42.42,"variantElement(v, 'Float64')":42.42} +Decimals +{"v":null,"variantElement(v, 'Decimal32(6)')":null} +{"v":"string","variantElement(v, 'Decimal32(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal32(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal32(6)')":null} +{"v":null,"variantElement(v, 'Decimal64(6)')":null} +{"v":"string","variantElement(v, 'Decimal64(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal64(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal64(6)')":null} +{"v":null,"variantElement(v, 'Decimal128(6)')":null} +{"v":"string","variantElement(v, 'Decimal128(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal128(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal128(6)')":null} +{"v":null,"variantElement(v, 'Decimal256(6)')":null} +{"v":"string","variantElement(v, 'Decimal256(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal256(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal256(6)')":null} +Dates and DateTimes +{"v":null,"variantElement(v, 'Date')":null} +{"v":"string","variantElement(v, 'Date')":null} +{"v":"2020-01-01","variantElement(v, 'Date')":"2020-01-01"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'Date')":null} +{"v":null,"variantElement(v, 'Date32')":null} +{"v":"string","variantElement(v, 'Date32')":null} +{"v":"1900-01-01","variantElement(v, 'Date32')":"1900-01-01"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'Date32')":null} +{"v":null,"variantElement(v, 'DateTime')":null} +{"v":"string","variantElement(v, 'DateTime')":null} +{"v":"2020-01-01 00:00:00","variantElement(v, 'DateTime')":"2020-01-01 00:00:00"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'DateTime')":null} +{"v":null,"variantElement(v, 'DateTime64')":null} +{"v":"string","variantElement(v, 'DateTime64')":null} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'DateTime64')":"2020-01-01 00:00:00.999"} +{"v":"2020-01-01 00:00:00.999999999 ABC","variantElement(v, 'DateTime64')":null} +UUID +{"v":null,"variantElement(v, 'UUID')":null} +{"v":"string","variantElement(v, 'UUID')":null} +{"v":"c8619cca-0caa-445e-ae76-1d4f6e0b3927","variantElement(v, 'UUID')":"c8619cca-0caa-445e-ae76-1d4f6e0b3927"} +IPv4 +{"v":null,"variantElement(v, 'IPv4')":null} +{"v":"string","variantElement(v, 'IPv4')":null} +{"v":"127.0.0.1","variantElement(v, 'IPv4')":"127.0.0.1"} +IPv6 +{"v":null,"variantElement(v, 'IPv6')":null} +{"v":"string","variantElement(v, 'IPv6')":null} +{"v":"2001:db8:85a3::8a2e:370:7334","variantElement(v, 'IPv6')":"2001:db8:85a3::8a2e:370:7334"} +Enum +{"v":null,"variantElement(v, 'Enum(\\'a\\' = 1)')":null} +{"v":"string","variantElement(v, 'Enum(\\'a\\' = 1)')":null} +{"v":"a","variantElement(v, 'Enum(\\'a\\' = 1)')":"a"} +{"v":"a","variantElement(v, 'Enum(\\'a\\' = 1)')":"a"} +{"v":2,"variantElement(v, 'Enum(\\'a\\' = 1)')":null} +Map +{"v":null,"variantElement(v, 'Map(String, UInt64)')":{}} +{"v":"string","variantElement(v, 'Map(String, UInt64)')":{}} 
+{"v":{"a":"42","b":"43","c":"0"},"variantElement(v, 'Map(String, UInt64)')":{"a":"42","b":"43","c":"0"}} +{"v":"{\"c\" : 44, \"d\" : [1,2,3]}","variantElement(v, 'Map(String, UInt64)')":{}} +Tuple +{"v":null,"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"0","b":"0"}} +{"v":"string","variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"0","b":"0"}} +{"v":{"a":"42","b":"0"},"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"42","b":"0"}} +{"v":{"a":"44","b":"0"},"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"44","b":"0"}} +\N (0,0) +string (0,0) +(42,0) (42,0) +{"a" : 44, "d" : 32} (0,0) +Array +{"v":null,"variantElement(v, 'Array(UInt64)')":[]} +{"v":"string","variantElement(v, 'Array(UInt64)')":[]} +{"v":["1","2","3"],"variantElement(v, 'Array(UInt64)')":["1","2","3"]} +{"v":["0","0","0"],"variantElement(v, 'Array(UInt64)')":["0","0","0"]} +{"v":"[1, 2, \"hello\"]","variantElement(v, 'Array(UInt64)')":[]} +LowCardinality +{"v":null,"variantElement(v, 'LowCardinality(String)')":null} +{"v":"string","variantElement(v, 'LowCardinality(String)')":"string"} +{"v":"42","variantElement(v, 'LowCardinality(String)')":null} +{"v":null,"variantElement(v, 'Array(LowCardinality(Nullable(String)))')":[]} +{"v":["string",null],"variantElement(v, 'Array(LowCardinality(Nullable(String)))')":["string",null]} +{"v":"42","variantElement(v, 'Array(LowCardinality(Nullable(String)))')":[]} +Nullable +{"v":null,"variantElement(v, 'Array(Nullable(String))')":[]} +{"v":"string","variantElement(v, 'Array(Nullable(String))')":[]} +{"v":["hello",null,"world"],"variantElement(v, 'Array(Nullable(String))')":["hello",null,"world"]} +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +CSV +String +\N,\N +"string","string" +"string","string" +42,\N +FixedString +\N,\N +"string",\N +"string",\N +"abcd","abcd" +Bool +\N,\N +"Truee",\N +true,true +Integers +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000000000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000000000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +"42d42",\N +Floats +\N,\N +"string",\N +42.42,42.42 +"42.d42",\N +\N,\N +"string",\N +42.42,42.42 +"42.d42",\N +Decimals +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +Dates and DateTimes +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01","2020-01-01" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"1900-01-01","1900-01-01" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01 
00:00:00","2020-01-01 00:00:00" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01 00:00:00.999","2020-01-01 00:00:00.999" +"2020-01-01 00:00:00.999999999 ABC",\N +UUID +\N,\N +"string",\N +"c8619cca-0caa-445e-ae76-1d4f6e0b3927","c8619cca-0caa-445e-ae76-1d4f6e0b3927" +"c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA",\N +IPv4 +\N,\N +"string",\N +"127.0.0.1","127.0.0.1" +"127.0.0.1AAA",\N +IPv6 +\N,\N +"string",\N +"2001:db8:85a3::8a2e:370:7334","2001:db8:85a3::8a2e:370:7334" +"2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA",\N +Enum +\N,\N +"string",\N +"a","a" +"a","a" +2,\N +"aa",\N +Map +\N,"{}" +"string","{}" +"{'a':42,'b':43,'c':0}","{'a':42,'b':43,'c':0}" +"{'c' : 44, 'd' : [1,2,3]}","{}" +"{'c' : 44","{}" +Array +\N,"[]" +"string","[]" +"[1,2,3]","[1,2,3]" +"[0,0,0]","[0,0,0]" +"[1, 2, 'hello']","[]" +"[1, 2","[]" +LowCardinality +\N,\N +"string","string" +42,\N +\N,"[]" +"['string',NULL]","['string',NULL]" +"['string', nul]","[]" +42,"[]" +Nullable +\N,"[]" +"string","[]" +"['hello',NULL,'world']","['hello',NULL,'world']" +"['hello', nul]","[]" +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +TSV +String +\N \N +string string +42 \N +FixedString +\N \N +string \N +abcd abcd +Bool +\N \N +Truee \N +true true +Integers +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000000000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000000000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +42d42 \N +\N \N +string \N +-1 \N +0 0 +42d42 \N +Floats +\N \N +string \N +42.42 42.42 +42.d42 \N +\N \N +string \N +42.42 42.42 +42.d42 \N +Decimals +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +Dates and DateTimes +\N \N +string \N +2020-01-d1 \N +2020-01-01 2020-01-01 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +1900-01-01 1900-01-01 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +2020-01-01 00:00:00 2020-01-01 00:00:00 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +2020-01-01 00:00:00.999 2020-01-01 00:00:00.999 +2020-01-01 00:00:00.999999999 ABC \N +UUID +\N \N +string \N +c8619cca-0caa-445e-ae76-1d4f6e0b3927 c8619cca-0caa-445e-ae76-1d4f6e0b3927 +c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA \N +IPv4 +\N \N +string \N +127.0.0.1 127.0.0.1 +127.0.0.1AAA \N +IPv6 +\N \N +string \N +2001:db8:85a3::8a2e:370:7334 2001:db8:85a3::8a2e:370:7334 +2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA \N +Enum +\N \N +string \N +a a +a a +2 \N +aa \N +Map +\N {} +string {} +{'a':42,'b':43,'c':0} {'a':42,'b':43,'c':0} +{\'c\' : 44, \'d\' : [1,2,3]} {} +{\'c\' : 44 {} +Array +\N [] +string [] +[1,2,3] 
[1,2,3] +[0,0,0] [0,0,0] +[1, 2, \'hello\'] [] +[1, 2 [] +LowCardinality +\N \N +string string +42 \N +\N [] +['string',NULL] ['string',NULL] +[\'string\', nul] [] +42 [] +Nullable +\N [] +string [] +['hello',NULL,'world'] ['hello',NULL,'world'] +[\'hello\', nul] [] +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +Values +String +(NULL,NULL),('string','string'),(42,NULL)FixedString +(NULL,NULL),('string',NULL),('abcd','abcd')Bool +(NULL,NULL),(true,true)Integers +(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0)(NULL,NULL),('string',NULL),(-1,NULL),(0,0)Floats +(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Decimals +(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Dates and DateTimes +(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01 00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000','1970-01-01 00:00:00.000'),('2020-01-01 00:00:00.999',NULL),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID +(NULL,NULL),('string',NULL),('c8619cca-0caa-445e-ae76-1d4f6e0b3927','c8619cca-0caa-445e-ae76-1d4f6e0b3927'),('c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA',NULL)IPv4 +(NULL,NULL),('string',NULL),('127.0.0.1','127.0.0.1'),('127.0.0.1AAA',NULL)IPv6 +(NULL,NULL),('string',NULL),('2001:db8:85a3::8a2e:370:7334','2001:db8:85a3::8a2e:370:7334'),('2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA',NULL)Enum +(NULL,NULL),('string',NULL),('a','a'),(1,NULL),(2,NULL),('aa',NULL)Map +(NULL,{}),('string',{}),({'a':42,'b':43,'c':0},{'a':42,'b':43,'c':0})Array +(NULL,[]),('string',[]),([1,2,3],[1,2,3]),([0,0,0],[0,0,0])LowCardinality +(NULL,NULL),('string','string'),(42,NULL)(NULL,[]),(['string',NULL],['string',NULL]),(42,[])Nullable +(NULL,[]),('string',[]),(['hello',NULL,'world'],['hello',NULL,'world']) diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.sql b/tests/queries/0_stateless/02940_variant_text_deserialization.sql new file mode 100644 index 00000000000..041d02088ef --- /dev/null +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.sql @@ -0,0 +1,266 @@ +set allow_experimental_variant_type = 1; +set session_timezone = 'UTC'; + +select 'JSON'; +select 'String'; +select v, variantElement(v, 'String') from format(JSONEachRow, 'v Variant(String, UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : 42}') format JSONEachRow; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(JSONEachRow, 'v Variant(String, FixedString(4))', '{"v" : null}, {"v" : "string"}, {"v" : "abcd"}') format JSONEachRow; + +select 'Bool'; +select v, 
variantElement(v, 'Bool') from format(JSONEachRow, 'v Variant(String, Bool)', '{"v" : null}, {"v" : "string"}, {"v" : true}') format JSONEachRow; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(JSONEachRow, 'v Variant(String, Int8, UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt8') from format(JSONEachRow, 'v Variant(String, UInt8, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int16') from format(JSONEachRow, 'v Variant(String, Int16, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt16') from format(JSONEachRow, 'v Variant(String, UInt16, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int32') from format(JSONEachRow, 'v Variant(String, Int32, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt32') from format(JSONEachRow, 'v Variant(String, UInt32, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int64') from format(JSONEachRow, 'v Variant(String, Int64, Int128)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000000000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt64') from format(JSONEachRow, 'v Variant(String, UInt64, Int128)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000000000000000}') format JSONEachRow; +select v, variantElement(v, 'Int128') from format(JSONEachRow, 'v Variant(String, Int128, Int256)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}') format JSONEachRow; +select v, variantElement(v, 'UInt128') from format(JSONEachRow, 'v Variant(String, UInt128, Int256)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}') format JSONEachRow; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(JSONEachRow, 'v Variant(String, Float32)', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}') format JSONEachRow; +select v, variantElement(v, 'Float64') from format(JSONEachRow, 'v Variant(String, Float64)', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}') format JSONEachRow; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(JSONEachRow, 'v Variant(String, Decimal32(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal64(6)') from format(JSONEachRow, 'v Variant(String, Decimal64(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal128(6)') from format(JSONEachRow, 'v Variant(String, Decimal128(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal256(6)') from format(JSONEachRow, 'v Variant(String, Decimal256(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 
4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(JSONEachRow, 'v Variant(String, Date, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'Date32') from format(JSONEachRow, 'v Variant(String, Date32, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "1900-01-01"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'DateTime') from format(JSONEachRow, 'v Variant(String, DateTime, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01 00:00:00"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'DateTime64') from format(JSONEachRow, 'v Variant(String, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01 00:00:00.999"}, {"v" : "2020-01-01 00:00:00.999999999 ABC"}') format JSONEachRow; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(JSONEachRow, 'v Variant(String, UUID)', '{"v" : null}, {"v" : "string"}, {"v" : "c8619cca-0caa-445e-ae76-1d4f6e0b3927"}') format JSONEachRow; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(JSONEachRow, 'v Variant(String, IPv4)', '{"v" : null}, {"v" : "string"}, {"v" : "127.0.0.1"}') format JSONEachRow; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(JSONEachRow, 'v Variant(String, IPv6)', '{"v" : null}, {"v" : "string"}, {"v" : "2001:0db8:85a3:0000:0000:8a2e:0370:7334"}') format JSONEachRow; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(JSONEachRow, 'v Variant(String, UInt32, Enum(''a'' = 1))', '{"v" : null}, {"v" : "string"}, {"v" : "a"}, {"v" : 1}, {"v" : 2}') format JSONEachRow; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(JSONEachRow, 'v Variant(String, Map(String, UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : 43, "c" : null}}, {"v" : {"c" : 44, "d" : [1,2,3]}}') format JSONEachRow; + +select 'Tuple'; +select v, variantElement(v, 'Tuple(a UInt64, b UInt64)') from format(JSONEachRow, 'v Variant(String, Tuple(a UInt64, b UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : null}}, {"v" : {"a" : 44, "d" : 32}}') format JSONEachRow; +select v, variantElement(v, 'Tuple(a UInt64, b UInt64)') from format(JSONEachRow, 'v Variant(String, Tuple(a UInt64, b UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : null}}, {"v" : {"a" : 44, "d" : 32}}') settings input_format_json_defaults_for_missing_elements_in_named_tuple=0; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(JSONEachRow, 'v Variant(String, Array(UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : [1, 2, 3]}, {"v" : [null, null, null]} {"v" : [1, 2, "hello"]}') format JSONEachRow; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(JSONEachRow, 'v Variant(LowCardinality(String), UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : 42}') format JSONEachRow; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(JSONEachRow, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64)', '{"v" : null}, {"v" : ["string", null]}, {"v" : 42}') format JSONEachRow; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(JSONEachRow, 'v Variant(String, 
Array(Nullable(String)))', '{"v" : null}, {"v" : "string"}, {"v" : ["hello", null, "world"]}') format JSONEachRow; + +select repeat('-', 80) format JSONEachRow; + +select 'CSV'; +select 'String'; +select v, variantElement(v, 'String') from format(CSV, 'v Variant(String, UInt64)', '\\N\n"string"\nstring\n42') format CSV; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(CSV, 'v Variant(String, FixedString(4))', '\\N\n"string"\nstring\n"abcd"') format CSV; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(CSV, 'v Variant(String, Bool)', '\\N\nTruee\nTrue') format CSV; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(CSV, 'v Variant(String, Int8, UInt64)', '\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt8') from format(CSV, 'v Variant(String, UInt8, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int16') from format(CSV, 'v Variant(String, Int16, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt16') from format(CSV, 'v Variant(String, UInt16, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int32') from format(CSV, 'v Variant(String, Int32, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt32') from format(CSV, 'v Variant(String, UInt32, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int64') from format(CSV, 'v Variant(String, Int64, Int128)', '\\N\n"string"\n-1\n0\n10000000000000000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt64') from format(CSV, 'v Variant(String, UInt64, Int128)', '\\N\n"string"\n-1\n0\n10000000000000000000000\n42d42') format CSV; +select v, variantElement(v, 'Int128') from format(CSV, 'v Variant(String, Int128, Int256)', '\\N\n"string"\n-1\n0\n42d42') format CSV; +select v, variantElement(v, 'UInt128') from format(CSV, 'v Variant(String, UInt128, Int256)', '\\N\n"string"\n-1\n0\n42d42') format CSV; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(CSV, 'v Variant(String, Float32)', '\\N\n"string"\n42.42\n42.d42') format CSV; +select v, variantElement(v, 'Float64') from format(CSV, 'v Variant(String, Float64)', '\\N\n"string"\n42.42\n42.d42') format CSV; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(CSV, 'v Variant(String, Decimal32(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal64(6)') from format(CSV, 'v Variant(String, Decimal64(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal128(6)') from format(CSV, 'v Variant(String, Decimal128(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal256(6)') from format(CSV, 'v Variant(String, Decimal256(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(CSV, 'v Variant(String, 
Date, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'Date32') from format(CSV, 'v Variant(String, Date32, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"1900-01-01"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'DateTime') from format(CSV, 'v Variant(String, DateTime, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01 00:00:00"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'DateTime64') from format(CSV, 'v Variant(String, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01 00:00:00.999"\n"2020-01-01 00:00:00.999999999 ABC"') format CSV; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(CSV, 'v Variant(String, UUID)', '\\N\n"string"\n"c8619cca-0caa-445e-ae76-1d4f6e0b3927"\nc8619cca-0caa-445e-ae76-1d4f6e0b3927AAA') format CSV; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(CSV, 'v Variant(String, IPv4)', '\\N\n"string"\n"127.0.0.1"\n"127.0.0.1AAA"') format CSV; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(CSV, 'v Variant(String, IPv6)', '\\N\n"string"\n"2001:0db8:85a3:0000:0000:8a2e:0370:7334"\n2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA') format CSV; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(CSV, 'v Variant(String, UInt32, Enum(''a'' = 1))', '\\N\n"string"\n"a"\n1\n2\naa') format CSV; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(CSV, 'v Variant(String, Map(String, UInt64))', '\\N\n"string"\n"{''a'' : 42, ''b'' : 43, ''c'' : null}"\n"{''c'' : 44, ''d'' : [1,2,3]}"\n"{''c'' : 44"') format CSV; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(CSV, 'v Variant(String, Array(UInt64))', '\\N\n"string"\n"[1, 2, 3]"\n"[null, null, null]"\n"[1, 2, ''hello'']"\n"[1, 2"') format CSV; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(CSV, 'v Variant(LowCardinality(String), UInt64)', '\\N\n"string"\n42') format CSV; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(CSV, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '\\N\n"[''string'', null]"\n"[''string'', nul]"\n42') format CSV; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(CSV, 'v Variant(String, Array(Nullable(String)))', '\\N\n"string"\n"[''hello'', null, ''world'']"\n"[''hello'', nul]"') format CSV; + +select repeat('-', 80) format JSONEachRow; + +select 'TSV'; +select 'String'; +select v, variantElement(v, 'String') from format(TSV, 'v Variant(String, UInt64)', '\\N\nstring\n42') format TSV; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(TSV, 'v Variant(String, FixedString(4))', '\\N\nstring\nabcd') format TSV; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(TSV, 'v Variant(String, Bool)', '\\N\nTruee\nTrue') format TSV; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(TSV, 'v Variant(String, Int8, UInt64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt8') from format(TSV, 'v Variant(String, UInt8, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int16') from format(TSV, 'v Variant(String, Int16, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt16') from format(TSV, 'v Variant(String, UInt16, Int64)', 
'\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int32') from format(TSV, 'v Variant(String, Int32, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt32') from format(TSV, 'v Variant(String, UInt32, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int64') from format(TSV, 'v Variant(String, Int64, Int128)', '\\N\nstring\n-1\n0\n10000000000000000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt64') from format(TSV, 'v Variant(String, UInt64, Int128)', '\\N\nstring\n-1\n0\n10000000000000000000000\n42d42') format TSV; +select v, variantElement(v, 'Int128') from format(TSV, 'v Variant(String, Int128, Int256)', '\\N\nstring\n-1\n0\n42d42') format TSV; +select v, variantElement(v, 'UInt128') from format(TSV, 'v Variant(String, UInt128, Int256)', '\\N\nstring\n-1\n0\n42d42') format TSV; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(TSV, 'v Variant(String, Float32)', '\\N\nstring\n42.42\n42.d42') format TSV; +select v, variantElement(v, 'Float64') from format(TSV, 'v Variant(String, Float64)', '\\N\nstring\n42.42\n42.d42') format TSV; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(TSV, 'v Variant(String, Decimal32(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal64(6)') from format(TSV, 'v Variant(String, Decimal64(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal128(6)') from format(TSV, 'v Variant(String, Decimal128(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal256(6)') from format(TSV, 'v Variant(String, Decimal256(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(TSV, 'v Variant(String, Date, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'Date32') from format(TSV, 'v Variant(String, Date32, DateTime64)', '\\N\nstring\n2020-01-d1\n1900-01-01\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'DateTime') from format(TSV, 'v Variant(String, DateTime, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01 00:00:00\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'DateTime64') from format(TSV, 'v Variant(String, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01 00:00:00.999\n2020-01-01 00:00:00.999999999 ABC') format TSV; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(TSV, 'v Variant(String, UUID)', '\\N\nstring\nc8619cca-0caa-445e-ae76-1d4f6e0b3927\nc8619cca-0caa-445e-ae76-1d4f6e0b3927AAA') format TSV; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(TSV, 'v Variant(String, IPv4)', '\\N\nstring\n127.0.0.1\n127.0.0.1AAA') format TSV; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(TSV, 'v Variant(String, IPv6)', '\\N\nstring\n2001:0db8:85a3:0000:0000:8a2e:0370:7334\n2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA') 
format TSV; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(TSV, 'v Variant(String, UInt32, Enum(''a'' = 1))', '\\N\nstring\na\n1\n2\naa') format TSV; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(TSV, 'v Variant(String, Map(String, UInt64))', '\\N\nstring\n{''a'' : 42, ''b'' : 43, ''c'' : null}\n{''c'' : 44, ''d'' : [1,2,3]}\n{''c'' : 44') format TSV; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(TSV, 'v Variant(String, Array(UInt64))', '\\N\nstring\n[1, 2, 3]\n[null, null, null]\n[1, 2, ''hello'']\n[1, 2') format TSV; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(TSV, 'v Variant(LowCardinality(String), UInt64)', '\\N\nstring\n42') format TSV; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(TSV, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '\\N\n[''string'', null]\n[''string'', nul]\n42') format TSV; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(TSV, 'v Variant(String, Array(Nullable(String)))', '\\N\nstring\n[''hello'', null, ''world'']\n[''hello'', nul]') format TSV; + +select repeat('-', 80) format JSONEachRow; + +select 'Values'; +select 'String'; +select v, variantElement(v, 'String') from format(Values, 'v Variant(String, UInt64)', '(NULL), (''string''), (42)') format Values; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(Values, 'v Variant(String, FixedString(4))', '(NULL), (''string''), (''abcd'')') format Values; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(Values, 'v Variant(String, Bool)', '(NULL), (True)') format Values; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(Values, 'v Variant(String, Int8, UInt64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt8') from format(Values, 'v Variant(String, UInt8, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int16') from format(Values, 'v Variant(String, Int16, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt16') from format(Values, 'v Variant(String, UInt16, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int32') from format(Values, 'v Variant(String, Int32, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt32') from format(Values, 'v Variant(String, UInt32, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int64') from format(Values, 'v Variant(String, Int64, Int128)', '(NULL), (''string''), (-1), (0), (10000000000000000000000)') format Values; +select v, variantElement(v, 'UInt64') from format(Values, 'v Variant(String, UInt64, Int128)', '(NULL), (''string''), (-1), (0), (10000000000000000000000)') format Values; +select v, variantElement(v, 'Int128') from format(Values, 'v Variant(String, Int128, Int256)', '(NULL), (''string''), (-1), (0)') format Values; +select v, variantElement(v, 'UInt128') from format(Values, 'v Variant(String, UInt128, Int256)', '(NULL), (''string''), (-1), (0)') format Values; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(Values, 'v Variant(String, Float32)', '(NULL), (''string''), (42.42)') format Values; +select v, 
variantElement(v, 'Float64') from format(Values, 'v Variant(String, Float64)', '(NULL), (''string''), (42.42)') format Values; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(Values, 'v Variant(String, Decimal32(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal64(6)') from format(Values, 'v Variant(String, Decimal64(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal128(6)') from format(Values, 'v Variant(String, Decimal128(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal256(6)') from format(Values, 'v Variant(String, Decimal256(6))', '(NULL), (''string''), (42.42)') format Values; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(Values, 'v Variant(String, Date, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'Date32') from format(Values, 'v Variant(String, Date32, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''1900-01-01''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'DateTime') from format(Values, 'v Variant(String, DateTime, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01 00:00:00''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'DateTime64') from format(Values, 'v Variant(String, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01 00:00:00.999''), (''2020-01-01 00:00:00.999999999 ABC'')') format Values; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(Values, 'v Variant(String, UUID)', '(NULL), (''string''), (''c8619cca-0caa-445e-ae76-1d4f6e0b3927''), (''c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA'')') format Values; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(Values, 'v Variant(String, IPv4)', '(NULL), (''string''), (''127.0.0.1''), (''127.0.0.1AAA'')') format Values; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(Values, 'v Variant(String, IPv6)', '(NULL), (''string''), (''2001:0db8:85a3:0000:0000:8a2e:0370:7334''), (''2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA'')') format Values; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(Values, 'v Variant(String, UInt32, Enum(''a'' = 1))', '(NULL), (''string''), (''a''), (1), (2), (''aa'')') format Values; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(Values, 'v Variant(String, Map(String, UInt64))', '(NULL), (''string''), ({''a'' : 42, ''b'' : 43, ''c'' : null})') format Values; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(Values, 'v Variant(String, Array(UInt64))', '(NULL), (''string''), ([1, 2, 3]), ([null, null, null])') format Values; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(Values, 'v Variant(LowCardinality(String), UInt64)', '(NULL), (''string''), (42)') format Values; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(Values, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '(NULL), ([''string'', null]), (42)') format Values; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(Values, 'v Variant(String, Array(Nullable(String)))', '(NULL), (''string''), ([''hello'', null, ''world''])') format Values; + +select ''; \ No newline at end of file diff 
--git a/tests/queries/0_stateless/02941_variant_type_1.reference b/tests/queries/0_stateless/02941_variant_type_1.reference new file mode 100644 index 00000000000..8a6e77d4f6d --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_1.reference @@ -0,0 +1,2472 @@ +Memory +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) 
+(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N 
+\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +MergeTree wide +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N 
+\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] 
+[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02941_variant_type_1.sh b/tests/queries/0_stateless/02941_variant_type_1.sh new file mode 100755 index 00000000000..774acb4bbef --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_1.sh @@ -0,0 +1,124 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test1_insert() +{ + echo "test1 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(3);" + $CH_CLIENT -q "insert into test select number + 3, number from numbers(3);" + $CH_CLIENT -q "insert into test select number + 6, 'str_' || toString(number) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 9, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 12, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 15, range(number + 1)::Array(UInt64) from numbers(3);" +} + +function test1_select() +{ + echo "test1 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test2_insert() +{ + echo "test2 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(3);" + $CH_CLIENT -q "insert into test select number + 3, number % 2 ? NULL : number from numbers(3);" + $CH_CLIENT -q "insert into test select number + 6, number % 2 ? NULL : 'str_' || toString(number) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 9, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(('lc_str_' || toString(number))::LowCardinality(String), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" + $CH_CLIENT -q "insert into test select number + 12, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" + $CH_CLIENT -q "insert into test select number + 15, number % 2 ? 
CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(range(number + 1)::Array(UInt64), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" +} + +function test2_select() +{ + echo "test2 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test3_insert() +{ + echo "test3 insert" + $CH_CLIENT -q "insert into test with 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))' as type select number, multiIf(number % 6 == 0, CAST(NULL, type), number % 6 == 1, CAST('str_' || toString(number), type), number % 6 == 2, CAST(number, type), number % 6 == 3, CAST(('lc_str_' || toString(number))::LowCardinality(String), type), number % 6 == 4, CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), type), CAST(range(number + 1)::Array(UInt64), type)) as res from numbers(18);" +} + +function test3_select() +{ + echo "test3 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test1_insert + test1_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test1_select + fi + $CH_CLIENT -q "truncate table test;" + test2_insert + test2_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test2_select + fi + $CH_CLIENT -q "truncate table test;" + test3_insert + test3_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test3_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q 
"create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_2.reference b/tests/queries/0_stateless/02941_variant_type_2.reference new file mode 100644 index 00000000000..4b6d53c52ac --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_2.reference @@ -0,0 +1,51 @@ +Memory +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +MergeTree compact +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +MergeTree wide +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 diff --git a/tests/queries/0_stateless/02941_variant_type_2.sh b/tests/queries/0_stateless/02941_variant_type_2.sh new file mode 100755 index 00000000000..aef5bc3fe02 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_2.sh @@ -0,0 +1,71 @@ +#!/usr/bin/env bash +# tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test4_insert() +{ + echo "test4 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 200000, number from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 400000, 'str_' || toString(number) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 600000, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 800000, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 1000000, range(number % 20 + 1)::Array(UInt64) from numbers(200000);" +} + +function test4_select +{ + echo "test4 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test 
where isNotNull(v.\`Array(UInt64)\`.size0);" +} + +function run() +{ + test4_insert + test4_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test4_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_3.reference b/tests/queries/0_stateless/02941_variant_type_3.reference new file mode 100644 index 00000000000..1ccdb3acdff --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_3.reference @@ -0,0 +1,51 @@ +Memory +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +MergeTree compact +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +MergeTree wide +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 diff --git a/tests/queries/0_stateless/02941_variant_type_3.sh b/tests/queries/0_stateless/02941_variant_type_3.sh new file mode 100755 index 00000000000..d3692270deb --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_3.sh @@ -0,0 +1,71 @@ +#!/usr/bin/env bash +# tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test5_insert() +{ + echo "test5 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 200000, number % 2 ? NULL : number from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 400000, number % 2 ? NULL : 'str_' || toString(number) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 600000, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(('lc_str_' || toString(number))::LowCardinality(String), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 800000, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 1000000, number % 2 ? 
CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(range(number % 20 + 1)::Array(UInt64), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" +} + +function test5_select() +{ + echo "test5 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Array(UInt64)\`.size0);" +} + +function run() +{ + test5_insert + test5_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test5_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_4.reference b/tests/queries/0_stateless/02941_variant_type_4.reference new file mode 100644 index 00000000000..e13d5820343 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_4.reference @@ -0,0 +1,56 @@ +Memory +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- 
+MergeTree wide +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02941_variant_type_4.sh b/tests/queries/0_stateless/02941_variant_type_4.sh new file mode 100755 index 00000000000..b3cc041bcd8 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_4.sh @@ -0,0 +1,66 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test6_insert() +{ + echo "test6 insert" + $CH_CLIENT -q "insert into test with 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))' as type select number, multiIf(number % 6 == 0, CAST(NULL, type), number % 6 == 1, CAST('str_' || toString(number), type), number % 6 == 2, CAST(number, type), number % 6 == 3, CAST(('lc_str_' || toString(number))::LowCardinality(String), type), number % 6 == 4, CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), type), CAST(range(number % 20 + 1)::Array(UInt64), type)) as res from numbers(1200000);" +} + +function test6_select() +{ + echo "test6 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Array(UInt64)\`.size0);" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test6_insert + test6_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test6_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a 
UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02942_variant_cast.reference b/tests/queries/0_stateless/02942_variant_cast.reference new file mode 100644 index 00000000000..f3fd7a9ba33 --- /dev/null +++ b/tests/queries/0_stateless/02942_variant_cast.reference @@ -0,0 +1,25 @@ +\N +42 +0 +\N +2 +\N +Hello +Hello +NULL +Hello +Hello +\N +Hello +\N +0 +\N +42 +\N +Hello +2 +\N +Hello +5 +0 +1 diff --git a/tests/queries/0_stateless/02942_variant_cast.sql b/tests/queries/0_stateless/02942_variant_cast.sql new file mode 100644 index 00000000000..33587e3e438 --- /dev/null +++ b/tests/queries/0_stateless/02942_variant_cast.sql @@ -0,0 +1,23 @@ +set allow_experimental_variant_type=1; + +select NULL::Variant(String, UInt64); +select 42::UInt64::Variant(String, UInt64); +select 42::UInt32::Variant(String, UInt64); -- {serverError CANNOT_CONVERT_TYPE} +select now()::Variant(String, UInt64); -- {serverError CANNOT_CONVERT_TYPE} +select CAST(number % 2 ? NULL : number, 'Variant(String, UInt64)') from numbers(4); +select 'Hello'::LowCardinality(String)::Variant(LowCardinality(String), UInt64); +select 'Hello'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select 'NULL'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select 'Hello'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select CAST(CAST(number % 2 ? 
NULL : 'Hello', 'LowCardinality(Nullable(String))'), 'Variant(LowCardinality(String), UInt64)') from numbers(4); + +select NULL::Variant(String, UInt64)::UInt64; +select NULL::Variant(String, UInt64)::Nullable(UInt64); +select '42'::Variant(String, UInt64)::UInt64; +select 'str'::Variant(String, UInt64)::UInt64; -- {serverError CANNOT_PARSE_TEXT} +select CAST(multiIf(number % 3 == 0, NULL::Variant(String, UInt64), number % 3 == 1, 'Hello'::Variant(String, UInt64), number::Variant(String, UInt64)), 'Nullable(String)') from numbers(6); +select CAST(multiIf(number == 1, NULL::Variant(String, UInt64), number == 2, 'Hello'::Variant(String, UInt64), number::Variant(String, UInt64)), 'UInt64') from numbers(6); -- {serverError CANNOT_PARSE_TEXT} + + +select number::Variant(UInt64)::Variant(String, UInt64)::Variant(Array(String), String, UInt64) from numbers(2); +select 'str'::Variant(String, UInt64)::Variant(String, Array(UInt64)); -- {serverError CANNOT_CONVERT_TYPE} diff --git a/tests/queries/0_stateless/02943_variant_element.reference b/tests/queries/0_stateless/02943_variant_element.reference new file mode 100644 index 00000000000..ab8aaa8fdef --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_element.reference @@ -0,0 +1,44 @@ +\N +\N +\N +\N +0 +1 +2 +3 +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +[] +[[0]] +[[NULL]] +[[2]] +[[NULL]] diff --git a/tests/queries/0_stateless/02943_variant_element.sql b/tests/queries/0_stateless/02943_variant_element.sql new file mode 100644 index 00000000000..c8eff9775ad --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_element.sql @@ -0,0 +1,16 @@ +set allow_experimental_variant_type=1; +set use_variant_when_no_common_type_in_if=1; + +select variantElement(NULL::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement(number::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement(number::Variant(String, UInt64), 'String') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(String, UInt64), 'String') from numbers(4); +select variantElement((number % 2 ? NULL : 'str_' || toString(number))::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64), 'LowCardinality(String)') from numbers(4); +select variantElement(NULL::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64), 'LowCardinality(String)') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(Array(UInt64), UInt64), 'Array(UInt64)') from numbers(4); +select variantElement(NULL::Variant(Array(UInt64), UInt64), 'Array(UInt64)') from numbers(4); +select variantElement(number % 2 ? NULL : range(number + 1), 'Array(UInt64)') from numbers(4); + +select variantElement([[(number % 2 ? 
NULL : number)::Variant(String, UInt64)]], 'UInt64') from numbers(4); + diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference new file mode 100644 index 00000000000..3803f39253c --- /dev/null +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference @@ -0,0 +1,96 @@ +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +String str_0 +String str_1 +String str_2 +String str_3 +Nullable(String) str_0 +Nullable(String) str_1 +Nullable(String) str_2 +Nullable(String) str_3 +Array(UInt64) [0] +Array(UInt64) [0,1] +Array(UInt64) [0,1,2] +Array(UInt64) [0,1,2,3] +Array(UInt64) [0] +Array(UInt64) [0,1] +Array(UInt64) [0,1,2] +Array(UInt64) [0,1,2,3] +String str_0 +String str_1 +String str_2 +String str_3 +Nullable(String) str_0 +Nullable(String) str_1 +Nullable(String) str_2 +Nullable(String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) str_1 +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) str_1 +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql 
b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql new file mode 100644 index 00000000000..da36863bfda --- /dev/null +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql @@ -0,0 +1,64 @@ +set allow_experimental_variant_type=1; +set use_variant_when_no_common_type_in_if=1; + +select toTypeName(res), if(1, [1,2,3], 'str_1') as res; +select toTypeName(res), if(1, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(0, [1,2,3], 'str_1') as res; +select toTypeName(res), if(0, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(NULL, [1,2,3], 'str_1') as res; +select toTypeName(res), if(NULL, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], 'str_1') as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(1, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(1, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(0, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(0, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(NULL, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(NULL, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(1, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(1, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(0, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(0, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(NULL, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(NULL, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], materialize('str_1')::Nullable(String)) as res; + + +select toTypeName(res), if(0, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(0, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(1, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(1, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(NULL, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(NULL, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(number % 2, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from 
numbers(4);
+
+select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::LowCardinality(String)) as res from numbers(4);
+select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::LowCardinality(Nullable(String))) as res from numbers(4);
+
+
+select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, 'str_' || toString(number)) as res from numbers(6);
+select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::Nullable(String)) as res from numbers(6);
+select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::LowCardinality(String)) as res from numbers(6);
+select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::LowCardinality(Nullable(String))) as res from numbers(6);
+

From 0a7ca36e7fbd02b4b64a30371fa3118144179e51 Mon Sep 17 00:00:00 2001
From: avogar
Date: Tue, 19 Dec 2023 17:08:35 +0000
Subject: [PATCH 027/245] Remove unneeded changes in IColumn.h

---
 src/Columns/IColumn.h | 11 -----------
 1 file changed, 11 deletions(-)

diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h
index 0dcba5b310c..3f866e6213d 100644
--- a/src/Columns/IColumn.h
+++ b/src/Columns/IColumn.h
@@ -631,17 +631,6 @@ struct IsMutableColumns

 template <>
 struct IsMutableColumns<> { static const bool value = true; };

-template
-struct IsMutableColumnsOrRvalueReferences;
-
-template
-struct IsMutableColumnsOrRvalueReferences
-{
-    static const bool value = (std::is_assignable::value || std::is_rvalue_reference_v) && IsMutableColumnsOrRvalueReferences::value;
-};
-
-template <>
-struct IsMutableColumnsOrRvalueReferences<> { static const bool value = true; };

 template
 const Type * checkAndGetColumn(const IColumn & column)

From bd84799aecb0f8103fd88e9fb1491720f9ec90c8 Mon Sep 17 00:00:00 2001
From: avogar
Date: Tue, 19 Dec 2023 17:21:45 +0000
Subject: [PATCH 028/245] Fix style

---
 src/Columns/ColumnVariant.h                        | 4 ++--
 utils/check-style/aspell-ignore/en/aspell-dict.txt | 1 +
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h
index 692fdd1709e..702107504f0 100644
--- a/src/Columns/ColumnVariant.h
+++ b/src/Columns/ColumnVariant.h
@@ -9,7 +9,7 @@ namespace DB

 namespace ErrorCodes
 {
-    extern const int LOGICAL_ERROR;
+    extern const int NOT_IMPLEMENTED;
 }

 /**
@@ -263,7 +263,7 @@ public:
     bool hasOnlyNulls() const
     {
         /// If all variants are empty, we have only NULL values.
-        return std::all_of(variants.begin(), variants.end(), [](const auto & v){ return v->empty(); } );
+        return std::all_of(variants.begin(), variants.end(), [](const WrappedPtr & v){ return v->empty(); });
     }

     /// Check if local and global order is the same.
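A note on the invariant behind hasOnlyNulls() above: a row of a Variant column is NULL exactly when none of the variants holds a value for it, so the whole column is all-NULL precisely when every variant column is empty. The following minimal SQL sketch shows how this surfaces to queries; it assumes a server built with this patch series and the experimental setting enabled, and is an illustration rather than part of the patch:

set allow_experimental_variant_type = 1;

-- Odd rows carry no variant at all: they read back as NULL from the column
-- itself and from every variant extracted with variantElement.
-- Expected rows: (0, 0, \N), (\N, \N, \N), (2, 2, \N), (\N, \N, \N).
select v,
       variantElement(v, 'UInt64') as as_uint64,
       variantElement(v, 'String') as as_string
from (select (number % 2 ? NULL : number)::Variant(String, UInt64) as v from numbers(4));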
diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt
index 637ab0ce6d4..bc03f4b39f8 100644
--- a/utils/check-style/aspell-ignore/en/aspell-dict.txt
+++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt
@@ -2594,6 +2594,7 @@ uuid
 varPop
 varSamp
 variadic
+variantElement
 varint
 varpop
 varsamp

From e74ae96dd006f8ff5fc8150eba5ab0beb47ddba3 Mon Sep 17 00:00:00 2001
From: avogar
Date: Tue, 19 Dec 2023 17:35:13 +0000
Subject: [PATCH 029/245] Fix typo

---
 src/DataTypes/Serializations/SerializationNullable.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/DataTypes/Serializations/SerializationNullable.cpp b/src/DataTypes/Serializations/SerializationNullable.cpp
index e7f0e61f2a5..05c70827c35 100644
--- a/src/DataTypes/Serializations/SerializationNullable.cpp
+++ b/src/DataTypes/Serializations/SerializationNullable.cpp
@@ -206,7 +206,7 @@ ReturnType safeAppendToNullMap(ColumnNullable & column, bool is_null)
 }

 /// Deserialize value into non-nullable column. In case of NULL, insert default and set is_null to true.
-/// If ReturnType is bool, return true if parsing was succesfull and false in case of any error.
+/// If ReturnType is bool, return true if parsing was successful and false in case of any error.
 template
 static ReturnType deserializeImpl(IColumn & column, ReadBuffer & buf, CheckForNull && check_for_null, DeserializeNested && deserialize_nested, bool & is_null)
 {

From 9edbfb3a31e67722a6af3b418a119e9b2bbb164e Mon Sep 17 00:00:00 2001
From: avogar
Date: Tue, 19 Dec 2023 17:55:42 +0000
Subject: [PATCH 030/245] Fix build after merging with master

---
 src/DataTypes/Serializations/SerializationEnum.cpp | 10 +++++-----
 src/DataTypes/Serializations/SerializationEnum.h   |  2 +-
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp
index 6ad55913738..fb384547d64 100644
--- a/src/DataTypes/Serializations/SerializationEnum.cpp
+++ b/src/DataTypes/Serializations/SerializationEnum.cpp
@@ -47,7 +47,7 @@ bool SerializationEnum::tryDeserializeTextEscaped(IColumn & column, ReadBu
     {
         std::string field_name;
         readEscapedString(field_name, istr);
-        if (!this->tryGetValue(x, StringRef(field_name), true))
+        if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true))
             return false;
     }

@@ -75,7 +75,7 @@ bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuf
     std::string field_name;
     readQuotedStringWithSQLStyle(field_name, istr);
     FieldType x;
-    if (!this->tryGetValue(x, StringRef(field_name)))
+    if (!ref_enum_values.tryGetValue(x, StringRef(field_name)))
         return false;
     assert_cast(column).getData().push_back(x);
     return true;
@@ -111,7 +111,7 @@ bool SerializationEnum::tryDeserializeWholeText(IColumn & column, ReadBuff
     {
         std::string field_name;
         readStringUntilEOF(field_name, istr);
-        if (!this->tryGetValue(x, StringRef(field_name), true))
+        if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true))
             return false;
     }

@@ -157,7 +157,7 @@ bool SerializationEnum::tryDeserializeTextJSON(IColumn & column, ReadBuffe
     {
         std::string field_name;
         readJSONString(field_name, istr);
-        if (!this->tryGetValue(x, StringRef(field_name)))
+        if (!ref_enum_values.tryGetValue(x, StringRef(field_name)))
             return false;
     }

@@ -198,7 +198,7 @@ bool SerializationEnum::tryDeserializeTextCSV(IColumn & column, ReadBuffer
     {
         std::string field_name;
         readCSVString(field_name, istr, settings.csv);
-        if (!this->tryGetValue(x,
StringRef(field_name), true)) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true)) return false; } diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 708161dc5fd..5152a3fbc93 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -60,7 +60,7 @@ public: bool tryReadValue(ReadBuffer & istr, FieldType & x) const { - if (!tryReadText(x, istr) || !this->hasValue(x)) + if (!tryReadText(x, istr) || !ref_enum_values.hasValue(x)) return false; return true; From 3c9dd07f7b2c036f5d299869f16ae0a39621b25f Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 21:17:39 +0000 Subject: [PATCH 031/245] Fix special builds, fix test --- src/Columns/tests/gtest_column_variant.cpp | 5 ++++- src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp | 7 +++---- tests/queries/0_stateless/02941_variant_type_1.sh | 1 + tests/queries/0_stateless/02941_variant_type_2.sh | 2 +- tests/queries/0_stateless/02941_variant_type_3.sh | 2 +- tests/queries/0_stateless/02941_variant_type_4.sh | 1 + 6 files changed, 11 insertions(+), 7 deletions(-) diff --git a/src/Columns/tests/gtest_column_variant.cpp b/src/Columns/tests/gtest_column_variant.cpp index b701e2d3183..0a6512c46b7 100644 --- a/src/Columns/tests/gtest_column_variant.cpp +++ b/src/Columns/tests/gtest_column_variant.cpp @@ -582,7 +582,10 @@ TEST(ColumnVariant, PermuteAndIndexOneColumnNoNulls) ASSERT_EQ((*permuted_column)[2].get(), 2); auto index = ColumnUInt64::create(); - index->getData() = std::move(permutation); + index->getData().push_back(1); + index->getData().push_back(3); + index->getData().push_back(2); + index->getData().push_back(0); auto indexed_column = column->index(*index, 3); ASSERT_EQ(indexed_column->size(), 3); ASSERT_EQ((*indexed_column)[0].get(), 1); diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp index 81c4af97401..dfcd24aff58 100644 --- a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp @@ -15,10 +15,10 @@ void SerializationIP::deserializeText(DB::IColumn & column, DB::ReadBuffer IPv x; readText(x, istr); + assert_cast &>(column).getData().push_back(x); + if (whole && !istr.eof()) throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); - - assert_cast &>(column).getData().push_back(x); } template @@ -77,11 +77,10 @@ void SerializationIP::deserializeTextJSON(DB::IColumn & column, DB::ReadBuf /// this code looks weird, but we want to throw specific exception to match original behavior... 
if (istr.eof()) assertChar('"', istr); + assert_cast &>(column).getData().push_back(x); if (*istr.position() != '"') throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); istr.ignore(); - - assert_cast &>(column).getData().push_back(x); } template diff --git a/tests/queries/0_stateless/02941_variant_type_1.sh b/tests/queries/0_stateless/02941_variant_type_1.sh index 774acb4bbef..4cf8ad25122 100755 --- a/tests/queries/0_stateless/02941_variant_type_1.sh +++ b/tests/queries/0_stateless/02941_variant_type_1.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_2.sh b/tests/queries/0_stateless/02941_variant_type_2.sh index aef5bc3fe02..7064dfbf4ec 100755 --- a/tests/queries/0_stateless/02941_variant_type_2.sh +++ b/tests/queries/0_stateless/02941_variant_type_2.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# tags: long +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_3.sh b/tests/queries/0_stateless/02941_variant_type_3.sh index d3692270deb..303039edef7 100755 --- a/tests/queries/0_stateless/02941_variant_type_3.sh +++ b/tests/queries/0_stateless/02941_variant_type_3.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# tags: long +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_4.sh b/tests/queries/0_stateless/02941_variant_type_4.sh index b3cc041bcd8..169e43c6d69 100755 --- a/tests/queries/0_stateless/02941_variant_type_4.sh +++ b/tests/queries/0_stateless/02941_variant_type_4.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment From 1efd65b8c73951e60e94f74ccc45141a5b39d85e Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 20 Dec 2023 17:43:04 +0000 Subject: [PATCH 032/245] Fix tests --- src/Columns/ColumnVariant.cpp | 10 ++++++++++ src/Columns/ColumnVariant.h | 1 + src/DataTypes/DataTypeVariant.cpp | 12 ++++++++++++ src/DataTypes/DataTypeVariant.h | 1 + src/DataTypes/IDataType.h | 2 +- .../Serializations/SerializationVariantElement.cpp | 2 +- 6 files changed, 26 insertions(+), 2 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index 67754e77992..a3a0362b646 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -480,6 +480,16 @@ void ColumnVariant::insertFrom(const IColumn & src_, size_t n) } } +void ColumnVariant::insertIntoVariant(const DB::Field & x, Discriminator global_discr) +{ + if (global_discr > variants.size()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator: {}. 
The number of variants is {}", size_t(global_discr), variants.size()); + auto & variant = getVariantByGlobalDiscriminator(global_discr); + variant.insert(x); + getLocalDiscriminators().push_back(localDiscriminatorByGlobal(global_discr)); + getOffsets().push_back(variant.size() - 1); +} + void ColumnVariant::insertRangeFrom(const IColumn & src_, size_t start, size_t length) { const size_t num_variants = variants.size(); diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index 702107504f0..b388b118a69 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -174,6 +174,7 @@ public: StringRef getDataAt(size_t n) const override; void insertData(const char * pos, size_t length) override; void insert(const Field & x) override; + void insertIntoVariant(const Field & x, Discriminator global_discr); void insertFrom(const IColumn & src_, size_t n) override; void insertRangeFrom(const IColumn & src, size_t start, size_t length) override; void insertManyFrom(const IColumn & src, size_t position, size_t length) override; diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 77e1c504cf8..334ed2c7b10 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -1,9 +1,11 @@ #include +#include #include #include #include #include #include +#include #include #include #include @@ -94,6 +96,16 @@ MutableColumnPtr DataTypeVariant::createColumn() const return ColumnVariant::create(std::move(nested_columns)); } +ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & field) const +{ + auto field_type = applyVisitor(FieldToDataType(), field); + auto discr = tryGetVariantDiscriminator(field_type); + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); + auto column = createColumn(); + assert_cast(*column).insertIntoVariant(field, *discr); + return ColumnConst::create(std::move(column), size); +} Field DataTypeVariant::getDefault() const { diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h index 60113a188b0..ca15dff1476 100644 --- a/src/DataTypes/DataTypeVariant.h +++ b/src/DataTypes/DataTypeVariant.h @@ -37,6 +37,7 @@ public: MutableColumnPtr createColumn() const override; + ColumnPtr createColumnConst(size_t size, const Field & field) const override; Field getDefault() const override; bool equals(const IDataType & rhs) const override; diff --git a/src/DataTypes/IDataType.h b/src/DataTypes/IDataType.h index ccdf54f57c3..4533c23a89f 100644 --- a/src/DataTypes/IDataType.h +++ b/src/DataTypes/IDataType.h @@ -150,7 +150,7 @@ public: /** Create ColumnConst for corresponding type, with specified size and value. */ - ColumnPtr createColumnConst(size_t size, const Field & field) const; + virtual ColumnPtr createColumnConst(size_t size, const Field & field) const; ColumnPtr createColumnConstWithDefaultValue(size_t size) const; /** Get default value of data type. diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 4b24ee5754e..1c0808db2a0 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -204,7 +204,7 @@ ColumnPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB: /// If this variant is empty, fill result column with default values. 
if (prev->empty()) { - auto res = IColumn::mutate(makeNullableOrLowCardinalityNullableSafe(prev)); + auto res = makeNullableOrLowCardinalityNullableSafe(prev)->cloneEmpty(); res->insertManyDefaults(local_discriminators->size()); return res; } From 4f8789927db4dd0d9c79a80bebc805895d82297c Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 21 Dec 2023 15:53:21 +0000 Subject: [PATCH 033/245] Fix tests with analyzer, add more tests --- src/DataTypes/DataTypeVariant.cpp | 18 +- ...different_local_and_global_order.reference | 244 ++++++++++++++++++ ...e_with_different_local_and_global_order.sh | 82 ++++++ .../02944_variant_as_if_multi_if_result.sql | 1 + 4 files changed, 340 insertions(+), 5 deletions(-) create mode 100644 tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference create mode 100755 tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 334ed2c7b10..0575f220f22 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -98,12 +98,20 @@ MutableColumnPtr DataTypeVariant::createColumn() const ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & field) const { - auto field_type = applyVisitor(FieldToDataType(), field); - auto discr = tryGetVariantDiscriminator(field_type); - if (!discr) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); auto column = createColumn(); - assert_cast(*column).insertIntoVariant(field, *discr); + if (field.isNull()) + { + column->insertDefault(); + } + else + { + auto field_type = applyVisitor(FieldToDataType(), field); + auto discr = tryGetVariantDiscriminator(field_type); + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); + assert_cast(*column).insertIntoVariant(field, *discr); + } + return ColumnConst::create(std::move(column), size); } diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference new file mode 100644 index 00000000000..f2e355824f9 --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference @@ -0,0 +1,244 @@ +Memory +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 
str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +MergeTree wide +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh new file mode 100755 index 00000000000..88bd2d3bd42 --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh @@ -0,0 +1,82 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test1_insert() +{ + echo "test1 insert" + $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(10, 10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(20, 10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number < 35, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(30, 10) settings max_block_size=3" +} + +function test1_select() +{ + echo "test1 select" + $CH_CLIENT -q "select v, v.String, v.UInt64 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test2_insert() +{ + echo "test2 insert" + $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 10000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(2000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number < 5, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + } + +function test2_select() +{ + echo "test2 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test1_insert + test1_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test1_select + fi + $CH_CLIENT -q "truncate table test;" + test2_insert + test2_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test2_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" 
+$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql index da36863bfda..1121b21e383 100644 --- a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql @@ -1,3 +1,4 @@ +set allow_experimental_analyzer=0; -- The result type for if function with constant is different with analyzer. set allow_experimental_variant_type=1; set use_variant_when_no_common_type_in_if=1; From 38ec9b5f719740b4e94758f9e5578acd562df939 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 22 Dec 2023 00:11:39 +0000 Subject: [PATCH 034/245] Fix variant element deserialization --- .../Serializations/SerializationVariant.cpp | 27 ++-- .../SerializationVariantElement.cpp | 149 ++++++++++-------- ...different_local_and_global_order.reference | 30 ++-- ...e_with_different_local_and_global_order.sh | 8 +- 4 files changed, 117 insertions(+), 97 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index ebd44fd6955..910ad1da303 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -277,13 +277,10 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); /// First, deserialize new discriminators. - /// We deserialize them into a separate column to be able to use substream cache, - /// so if we also need to deserialize some of sub columns, we will read discriminators only once. settings.path.push_back(Substream::VariantDiscriminators); - ColumnPtr discriminators; if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { - discriminators = cached_discriminators; + col.getLocalDiscriminatorsPtr() = cached_discriminators; } else { @@ -291,29 +288,31 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( if (!discriminators_stream) throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams"); - discriminators = ColumnVariant::ColumnDiscriminators::create(); - SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); - addToSubstreamsCache(cache, settings.path, discriminators); + SerializationNumber().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr()); } settings.path.pop_back(); - /// Iterate through new discriminators, append them to column and calculate the limit for each variant. + /// Iterate through new discriminators and calculate the limit for each variant. /// While calculating limits we can also fill offsets column (we store offsets only in memory). 
-    const auto & discriminators_data = assert_cast<const ColumnVariant::ColumnDiscriminators &>(*discriminators).getData();
-    auto & local_discriminators = col.getLocalDiscriminators();
-    local_discriminators.reserve(local_discriminators.size() + limit);
+    auto & discriminators_data = col.getLocalDiscriminators();
     auto & offsets = col.getOffsets();
     offsets.reserve(offsets.size() + limit);
 
     std::vector<size_t> variant_limits(variants.size(), 0);
-    for (size_t i = 0; i != limit; ++i)
+    size_t discriminators_offset = discriminators_data.size() - limit;
+    for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i)
     {
         ColumnVariant::Discriminator discr = discriminators_data[i];
-        local_discriminators.push_back(discr);
         if (discr == ColumnVariant::NULL_DISCRIMINATOR)
+        {
             offsets.emplace_back();
+        }
         else
-            offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]++);
+        {
+            offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]);
+            ++variant_limits[discr];
+        }
     }
 
     /// Now we can deserialize variants according to their limits.
diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
index 1c0808db2a0..e06a20d2990 100644
--- a/src/DataTypes/Serializations/SerializationVariantElement.cpp
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -40,11 +40,31 @@ void SerializationVariantElement::serializeBinaryBulkStateSuffix(SerializeBinary
         ErrorCodes::NOT_IMPLEMENTED,
         "Method serializeBinaryBulkStateSuffix is not implemented for SerializationVariantElement");
 }
 
+struct DeserializeBinaryBulkStateVariantElement : public ISerialization::DeserializeBinaryBulkState
+{
+    /// During deserialization, discriminators and variant streams can be shared.
+    /// For example we can read several variant elements together: "select v.UInt32, v.String from table",
+    /// or we can read the whole variant and some of the variant elements: "select v, v.UInt32 from table".
+    /// To read the same column from the same stream more than once we use substream cache,
+    /// but this cache stores the whole column, not only the current range.
+    /// During deserialization of a variant element, discriminators and variant columns are not stored
+    /// in the result column, so we need to store them inside deserialization state, so we can use
+    /// substream cache correctly.
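+    /// Note: both columns accumulate rows across deserialize calls and are reset only when
+    /// reading of a new result column starts (see the result_column->empty() checks below).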
+ ColumnPtr discriminators; + ColumnPtr variant; + + ISerialization::DeserializeBinaryBulkStatePtr variant_element_state; +}; + void SerializationVariantElement::deserializeBinaryBulkStatePrefix(DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state) const { + auto variant_element_state = std::make_shared(); + addVariantToPath(settings.path); - nested_serialization->deserializeBinaryBulkStatePrefix(settings, state); + nested_serialization->deserializeBinaryBulkStatePrefix(settings, variant_element_state->variant_element_state); removeVariantFromPath(settings.path); + + state = std::move(variant_element_state); } void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const IColumn &, size_t, size_t, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const @@ -53,22 +73,19 @@ void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const I } void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( - ColumnPtr & column, + ColumnPtr & result_column, size_t limit, DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state, SubstreamsCache * cache) const { - auto mutable_column = column->assumeMutable(); - ColumnNullable * nullable_col = typeid_cast(mutable_column.get()); - NullMap * null_map = nullable_col ? &nullable_col->getNullMapData() : nullptr; + auto * variant_element_state = checkAndGetState(state); /// First, deserialize discriminators from Variant column. settings.path.push_back(Substream::VariantDiscriminators); - ColumnPtr discriminators; if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { - discriminators = cached_discriminators; + variant_element_state->discriminators = cached_discriminators; } else { @@ -76,85 +93,87 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( if (!discriminators_stream) throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams"); - discriminators = ColumnVariant::ColumnDiscriminators::create(); - SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); - addToSubstreamsCache(cache, settings.path, discriminators); + /// If we started to read a new column, reinitialize discriminators column in deserialization state. + if (!variant_element_state->discriminators || result_column->empty()) + variant_element_state->discriminators = ColumnVariant::ColumnDiscriminators::create(); + + SerializationNumber().deserializeBinaryBulk(*variant_element_state->discriminators->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, variant_element_state->discriminators); } settings.path.pop_back(); - /// Iterate through discriminators to calculate the size of the variant. - const auto & discriminators_data = assert_cast(*discriminators).getData(); - size_t variant_size = 0; - for (auto discr : discriminators_data) - variant_size += discr == variant_discriminator; + /// Iterate through new discriminators to calculate the limit for our variant. 
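+    /// Only the last `limit` discriminators belong to the current range; everything before them
+    /// was already deserialized by previous calls and is kept in the state.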
+    const auto & discriminators_data = assert_cast<const ColumnVariant::ColumnDiscriminators &>(*variant_element_state->discriminators).getData();
+    size_t discriminators_offset = variant_element_state->discriminators->size() - limit;
+    size_t variant_limit = 0;
+    for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i)
+        variant_limit += (discriminators_data[i] == variant_discriminator);
 
-    /// Now we know the size of the variant and can deserialize it.
+    /// Now we know the limit for our variant and can deserialize it.
 
-    /// If the size of variant column is the same as the size of discriminators,
-    /// we can deserialize new values directly into our column.
-    if (variant_size == discriminators_data.size())
+    /// If result column is Nullable, fill null map and extract nested column.
+    MutableColumnPtr mutable_column = result_column->assumeMutable();
+    if (isColumnNullable(*mutable_column))
     {
-        addVariantToPath(settings.path);
-        /// Special case when our result column is LowCardinality(Nullable(T)).
-        /// In this case the variant type is LowCardinality(T), and we cannot just
-        /// deserialize its values directly into LowCardinality(Nullable(T)) column.
-        /// We create a separate column with type LowCardinality(T), deserialize
-        /// values into it and then insert into result column using insertRangeFrom.
-        if (isColumnLowCardinalityNullable(*column))
+        auto & nullable_column = assert_cast<ColumnNullable &>(*mutable_column);
+        NullMap & null_map = nullable_column.getNullMapData();
+        /// If we have only our discriminator in range, fill null map with 0.
+        if (variant_limit == limit)
         {
-            ColumnPtr variant_col = mutable_column->cloneEmpty();
-            /// LowCardinality(Nullable(T)) -> LowCardinality(T)
-            assert_cast<ColumnLowCardinality &>(*variant_col->assumeMutable()).nestedRemoveNullable();
-            nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, limit, settings, state, cache);
-            mutable_column->insertRangeFrom(*variant_col, 0, variant_col->size());
+            null_map.resize_fill(null_map.size() + limit, 0);
         }
+        /// If our discriminator doesn't appear in the current range, fill null map with 1.
+        else if (variant_limit == 0)
+        {
+            null_map.resize_fill(null_map.size() + limit, 1);
+        }
+        /// Otherwise we should iterate through discriminators to fill null map.
         else
         {
-            nested_serialization->deserializeBinaryBulkWithMultipleStreams(nullable_col ? nullable_col->getNestedColumnPtr() : column, limit, settings, state, cache);
+            null_map.reserve(null_map.size() + limit);
+            for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i)
+                null_map.push_back(discriminators_data[i] != variant_discriminator);
         }
-        if (nullable_col)
-            null_map->resize_fill(null_map->size() + limit, 0);
-        removeVariantFromPath(settings.path);
-        return;
+
+        mutable_column = nullable_column.getNestedColumnPtr()->assumeMutable();
     }
 
-    /// If variant size is 0, just fill column with default values.
-    if (variant_size == 0)
+    /// If we started to read a new column, reinitialize variant column in deserialization state.
+    if (!variant_element_state->variant || result_column->empty())
     {
-        mutable_column->insertManyDefaults(limit);
-        return;
+        variant_element_state->variant = mutable_column->cloneEmpty();
+
+        /// When result column is LowCardinality(Nullable(T)) we should
+        /// remove Nullable from variant column before deserialization.
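+        /// (the variant column itself has type LowCardinality(T), since Variant never
+        /// wraps its nested variants in Nullable).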
+        if (isColumnLowCardinalityNullable(*mutable_column))
+            assert_cast<ColumnLowCardinality &>(*variant_element_state->variant->assumeMutable()).nestedRemoveNullable();
     }
 
-    /// In general case we should deserialize variant into a separate column,
-    /// iterate through discriminators and insert values from variant only when
-    /// row contains its discriminator and default value otherwise.
-    mutable_column->reserve(mutable_column->size() + limit);
-    mutable_column = nullable_col ? nullable_col->getNestedColumnPtr()->assumeMutable() : std::move(mutable_column);
-    ColumnPtr variant_col = mutable_column->cloneEmpty();
-
-    /// Special case when our result column is LowCardinality(Nullable(T)).
-    /// We should remove Nullable from variant column before deserialization.
-    if (isColumnLowCardinalityNullable(*column))
-        assert_cast<ColumnLowCardinality &>(*variant_col->assumeMutable()).nestedRemoveNullable();
-
     addVariantToPath(settings.path);
-    nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, variant_size, settings, state, cache);
+    nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache);
     removeVariantFromPath(settings.path);
 
-    size_t variant_index = 0;
-    for (auto discr : discriminators_data)
+    size_t variant_offset = variant_element_state->variant->size() - variant_limit;
+
+    /// If we don't have our discriminator in range, just insert defaults.
+    if (variant_limit == 0)
     {
-        if (discr == variant_discriminator)
+        mutable_column->insertManyDefaults(limit);
+    }
+    /// If we have only our discriminator in range, insert the whole range into the result column.
+    else if (variant_limit == limit)
+    {
+        mutable_column->insertRangeFrom(*variant_element_state->variant, variant_offset, variant_limit);
+    }
+    /// Otherwise iterate through discriminators and insert value from variant or default value depending on the discriminator.
+ else + { + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) { - if (null_map) - null_map->push_back(0); - mutable_column->insertFrom(*variant_col, variant_index++); - } - else - { - if (null_map) - null_map->push_back(1); - mutable_column->insertDefault(); + if (discriminators_data[i] == variant_discriminator) + mutable_column->insertFrom(*variant_element_state->variant, variant_offset++); + else + mutable_column->insertDefault(); } } } diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference index f2e355824f9..1736a307c42 100644 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference @@ -44,9 +44,9 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- MergeTree compact test1 insert @@ -136,14 +136,14 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- MergeTree wide test1 insert @@ -233,12 +233,12 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh index 88bd2d3bd42..9f4df8d7466 100755 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment @@ -29,14 +30,15 @@ function test2_insert() { echo "test2 insert" $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 10000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 1000000) settings 
max_insert_block_size = 100000, min_insert_block_size_rows=100000" $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(2000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number < 5, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - } + $CH_CLIENT -q "insert into test select number, if(number < 3500000, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" +} function test2_select() { echo "test2 select" + $CH_CLIENT -q "select v, v.String, v.UInt64 from test format Null;" $CH_CLIENT -q "select v from test format Null;" $CH_CLIENT -q "select count() from test where isNotNull(v);" $CH_CLIENT -q "select v.String from test format Null;" From 319c20091efe8eebee5bde9bb8bae67e58a589d9 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 22 Dec 2023 00:15:44 +0000 Subject: [PATCH 035/245] Fix comments --- src/DataTypes/Serializations/SerializationVariant.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 910ad1da303..3b51c51872f 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -276,7 +276,7 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( if (!col.hasGlobalVariantsOrder()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); - /// First, deserialize new discriminators. + /// First, deserialize discriminators. settings.path.push_back(Substream::VariantDiscriminators); if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { @@ -451,7 +451,7 @@ std::unordered_map getTypesTextDeserializePriorityMap() /// then for types with the same depth we sort by the types priority, and last we sort by the depth of LowCardinality/Nullable types, /// so if we have types with the same level of nesting and the same priority, we will first try to deserialize LowCardinality/Nullable types /// (for example if we have types Array(Array(String)) and Array(Array(Nullable(String))). -/// This is just a batch of heuristics, +/// This is just a batch of heuristics. std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map & priority_map) { if (const auto * nullable_type = typeid_cast(type.get())) @@ -553,7 +553,7 @@ bool SerializationVariant::tryDeserializeImpl( for (size_t global_discr : deserialize_text_order) { ReadBufferFromString variant_buf(field); - /// Usually try_deserialize_variant should not throw an exception, but let's use try/catch just in case. + /// Usually try_deserialize_variant should not throw any exception, but let's use try/catch just in case. 
try { auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); From a61efedba8854e8f06b549deb595315ee40eb303 Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:10:58 +0000 Subject: [PATCH 036/245] Fix serialization again, add more tests --- src/Columns/ColumnVariant.h | 2 +- src/Columns/ColumnVector.cpp | 2 +- src/DataTypes/DataTypeVariant.cpp | 15 +++++- .../Serializations/ISerialization.cpp | 7 +++ src/DataTypes/Serializations/ISerialization.h | 1 + .../Serializations/SerializationVariant.cpp | 52 ++++++++++++++----- .../02943_variant_read_subcolumns_1.reference | 6 +++ .../02943_variant_read_subcolumns_1.sh | 38 ++++++++++++++ .../02943_variant_read_subcolumns_2.reference | 6 +++ .../02943_variant_read_subcolumns_2.sh | 38 ++++++++++++++ 10 files changed, 150 insertions(+), 17 deletions(-) create mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference create mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh create mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference create mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index b388b118a69..ec58553f5f3 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -163,7 +163,7 @@ public: size_t size() const override { - return local_discriminators->size(); + return offsets->size(); } Field operator[](size_t n) const override; diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp index 37e62c76596..b4e3fee5e42 100644 --- a/src/Columns/ColumnVector.cpp +++ b/src/Columns/ColumnVector.cpp @@ -469,7 +469,7 @@ void ColumnVector::insertRangeFrom(const IColumn & src, size_t start, size_t const ColumnVector & src_vec = assert_cast(src); if (start + length > src_vec.data.size()) - throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, + throw Exception(ErrorCodes::LOGICAL_ERROR, "Parameters start = {}, length = {} are out of bound " "in ColumnVector::insertRangeFrom method (data.size() = {}).", toString(start), toString(length), toString(src_vec.data.size())); diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 0575f220f22..5dc42cc7443 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -108,7 +108,20 @@ ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & fiel auto field_type = applyVisitor(FieldToDataType(), field); auto discr = tryGetVariantDiscriminator(field_type); if (!discr) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); + { + for (size_t i = 0; i != variants.size(); ++i) + { + if (field.getType() == variants[i]->getDefault().getType()) + { + discr = i; + break; + } + } + } + + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" with type {} into column with type {}", toString(field), field.getTypeName(), getName()); + assert_cast(*column).insertIntoVariant(field, *discr); } diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 86a37949dc8..46353fffb48 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -124,15 +124,20 @@ void ISerialization::deserializeBinaryBulkWithMultipleStreams( DeserializeBinaryBulkStatePtr & /* state */, SubstreamsCache * cache) const { + 
LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize path {}. Initial column size: {}", settings.path.toString(), column->size()); + auto cached_column = getFromSubstreamsCache(cache, settings.path); if (cached_column) { column = cached_column; + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Use column from cache. Size: {}", cached_column->size()); } else if (ReadBuffer * stream = settings.getter(settings.path)) { auto mutable_column = column->assumeMutable(); + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize column. Initial size: {}", mutable_column->size()); deserializeBinaryBulk(*mutable_column, *stream, limit, settings.avg_value_size_hint); + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialized column. Size: {}", mutable_column->size()); column = std::move(mutable_column); addToSubstreamsCache(cache, settings.path, column); } @@ -177,6 +182,8 @@ String getNameForSubstreamPath( } else if (it->type == Substream::VariantDiscriminators) stream_name += ".discr"; + else if (it->type == Substream::VariantOffsets) + stream_name += ".variant_offsets"; else if (it->type == Substream::VariantElement) stream_name += "." + it->variant_element_name; } diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index f0273f59d1f..5c6fe31ed9e 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -153,6 +153,7 @@ public: ObjectData, VariantDiscriminators, + VariantOffsets, VariantElements, VariantElement, diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 3b51c51872f..d36151fe8e9 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -291,28 +291,17 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( SerializationNumber().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0); addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr()); } - settings.path.pop_back(); - /// Iterate through new discriminators and calculate the limit for each variant. - /// While calculating limits we can also fill offsets column (we store offsets only in memory). - auto & discriminators_data = col.getLocalDiscriminators(); - auto & offsets = col.getOffsets(); - offsets.reserve(offsets.size() + limit); + /// Second, calculate limits for each variant by iterating through new discriminators. std::vector variant_limits(variants.size(), 0); + auto & discriminators_data = col.getLocalDiscriminators(); size_t discriminators_offset = discriminators_data.size() - limit; for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) { ColumnVariant::Discriminator discr = discriminators_data[i]; - if (discr == ColumnVariant::NULL_DISCRIMINATOR) - { - offsets.emplace_back(); - } - else - { - offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]); + if (discr != ColumnVariant::NULL_DISCRIMINATOR) ++variant_limits[discr]; - } } /// Now we can deserialize variants according to their limits. @@ -325,6 +314,41 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( settings.path.pop_back(); } settings.path.pop_back(); + + /// Fill offsets column. 
+    /// It's important to do it after deserialization of all variants, because to fill offsets we need
+    /// initial variant sizes without values in the current range, but some variants can be shared with
+    /// other columns via substream cache and they can already contain values from this range even
+    /// before we call deserialize for them. So, before deserializing we cannot know for sure if
+    /// variant columns already contain values from the current range or not. But after calling deserialize
+    /// we know for sure that they contain these values, so we can use variant limits and their
+    /// new sizes to calculate correct offsets.
+    settings.path.push_back(Substream::VariantOffsets);
+    if (auto cached_offsets = getFromSubstreamsCache(cache, settings.path))
+    {
+        col.getOffsetsPtr() = cached_offsets;
+    }
+    else
+    {
+        auto & offsets = col.getOffsets();
+        offsets.reserve(offsets.size() + limit);
+        std::vector<size_t> variant_offsets;
+        variant_offsets.reserve(variants.size());
+        for (size_t i = 0; i != variants.size(); ++i)
+            variant_offsets.push_back(col.getVariantByLocalDiscriminator(i).size() - variant_limits[i]);
+
+        for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i)
+        {
+            ColumnVariant::Discriminator discr = discriminators_data[i];
+            if (discr == ColumnVariant::NULL_DISCRIMINATOR)
+                offsets.emplace_back();
+            else
+                offsets.push_back(variant_offsets[discr]++);
+        }
+
+        addToSubstreamsCache(cache, settings.path, col.getOffsetsPtr());
+    }
+    settings.path.pop_back();
 }
 
 void SerializationVariant::addVariantElementToPath(DB::ISerialization::SubstreamPath & path, size_t i) const
diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference
new file mode 100644
index 00000000000..4b93782cddf
--- /dev/null
+++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference
@@ -0,0 +1,6 @@
+Memory
+test
+MergeTree compact
+test
+MergeTree wide
+test
diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh
new file mode 100755
index 00000000000..9ccad55191f
--- /dev/null
+++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh
@@ -0,0 +1,38 @@
+#!/usr/bin/env bash
+# Tags: long
+
+CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
+# reset --log_comment
+CLICKHOUSE_LOG_COMMENT=
+# shellcheck source=../shell_config.sh
+. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test() +{ + echo "test" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" + $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +test +$CH_CLIENT -q "drop table test;" + diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference new file mode 100644 index 00000000000..4b93782cddf --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference @@ -0,0 +1,6 @@ +Memory +test +MergeTree compact +test +MergeTree wide +test diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh new file mode 100755 index 00000000000..9ccad55191f --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh @@ -0,0 +1,38 @@ +#!/usr/bin/env bash +# Tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test() +{ + echo "test" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" + $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +test +$CH_CLIENT -q "drop table test;" + From 4931b363079aa5dd4fbc35ff6faea62efaf218de Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:32:28 +0000 Subject: [PATCH 037/245] Fix style --- src/Columns/ColumnVector.cpp | 2 +- src/DataTypes/Serializations/SerializationArray.cpp | 5 +++-- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp index b4e3fee5e42..37e62c76596 100644 --- a/src/Columns/ColumnVector.cpp +++ b/src/Columns/ColumnVector.cpp @@ -469,7 +469,7 @@ void ColumnVector::insertRangeFrom(const IColumn & src, size_t start, size_t const ColumnVector & src_vec = assert_cast(src); if (start + length > src_vec.data.size()) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Parameters start = {}, length = {} are out of bound " "in ColumnVector::insertRangeFrom method (data.size() = {}).", toString(start), toString(length), toString(src_vec.data.size())); diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index be23278ef25..bb22af16c69 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -348,6 +348,7 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( { auto mutable_column = column->assumeMutable(); ColumnArray & column_array = typeid_cast(*mutable_column); + size_t prev_last_offset = column_array.getOffsets().back(); settings.path.push_back(Substream::ArraySizes); if (auto cached_column = getFromSubstreamsCache(cache, settings.path)) @@ -371,9 +372,9 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( /// Number 
of values corresponding with `offset_values` must be read. size_t last_offset = offset_values.back(); - if (last_offset < nested_column->size()) + if (last_offset < prev_last_offset) throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested column is longer than last offset"); - size_t nested_limit = last_offset - nested_column->size(); + size_t nested_limit = last_offset - prev_last_offset; if (unlikely(nested_limit > MAX_ARRAYS_SIZE)) throw Exception(ErrorCodes::TOO_LARGE_ARRAY_SIZE, "Array sizes are too large: {}", nested_limit); From 4e4aa90430d02f1fcc17b517946799f23c59b83e Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:35:20 +0000 Subject: [PATCH 038/245] Remove debug logging --- src/DataTypes/Serializations/ISerialization.cpp | 5 ----- 1 file changed, 5 deletions(-) diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 46353fffb48..08575f06f2a 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -124,20 +124,15 @@ void ISerialization::deserializeBinaryBulkWithMultipleStreams( DeserializeBinaryBulkStatePtr & /* state */, SubstreamsCache * cache) const { - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize path {}. Initial column size: {}", settings.path.toString(), column->size()); - auto cached_column = getFromSubstreamsCache(cache, settings.path); if (cached_column) { column = cached_column; - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Use column from cache. Size: {}", cached_column->size()); } else if (ReadBuffer * stream = settings.getter(settings.path)) { auto mutable_column = column->assumeMutable(); - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize column. Initial size: {}", mutable_column->size()); deserializeBinaryBulk(*mutable_column, *stream, limit, settings.avg_value_size_hint); - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialized column. 
Size: {}", mutable_column->size()); column = std::move(mutable_column); addToSubstreamsCache(cache, settings.path, column); } From f594ab34f50c1bcd860bd3b950c8d74ffe09662d Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 12:56:11 +0000 Subject: [PATCH 039/245] Fix special build --- src/Columns/ColumnVariant.cpp | 8 +++--- src/Columns/ColumnVariant.h | 2 +- .../Serializations/SerializationArray.cpp | 5 ++-- .../Serializations/SerializationVariant.cpp | 26 +++++++------------ src/Functions/if.cpp | 2 +- 5 files changed, 17 insertions(+), 26 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index a3a0362b646..f90ebfc54bb 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -102,7 +102,7 @@ ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColu { } -ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & global_discriminators) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), global_discriminators) +ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), local_to_global_discriminators_) { } @@ -449,12 +449,12 @@ void ColumnVariant::insertData(const char *, size_t) throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method insertData is not supported for {}", getName()); } -void ColumnVariant::insert(const Field & field) +void ColumnVariant::insert(const Field & x) { - if (field.isNull()) + if (x.isNull()) insertDefault(); else - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(field), getName()); + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(x), getName()); } void ColumnVariant::insertFrom(const IColumn & src_, size_t n) diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index ec58553f5f3..eb96205924c 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -194,7 +194,7 @@ public: template ColumnPtr indexImpl(const PaddedPODArray & indexes, size_t limit) const; ColumnPtr replicate(const Offsets & replicate_offsets) const override; - MutableColumns scatter(ColumnIndex num_variants, const Selector & selector) const override; + MutableColumns scatter(ColumnIndex num_columns, const Selector & selector) const override; void gather(ColumnGathererStream & gatherer_stream) override; /// Variant type is not comparable. diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index bb22af16c69..be23278ef25 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -348,7 +348,6 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( { auto mutable_column = column->assumeMutable(); ColumnArray & column_array = typeid_cast(*mutable_column); - size_t prev_last_offset = column_array.getOffsets().back(); settings.path.push_back(Substream::ArraySizes); if (auto cached_column = getFromSubstreamsCache(cache, settings.path)) @@ -372,9 +371,9 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( /// Number of values corresponding with `offset_values` must be read. 
size_t last_offset = offset_values.back(); - if (last_offset < prev_last_offset) + if (last_offset < nested_column->size()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested column is longer than last offset"); - size_t nested_limit = last_offset - prev_last_offset; + size_t nested_limit = last_offset - nested_column->size(); if (unlikely(nested_limit > MAX_ARRAYS_SIZE)) throw Exception(ErrorCodes::TOO_LARGE_ARRAY_SIZE, "Array sizes are too large: {}", nested_limit); diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index d36151fe8e9..c88dd8e9e0d 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -564,7 +564,7 @@ bool SerializationVariant::tryDeserializeImpl( IColumn & column, const String & field, std::function check_for_null, - std::function try_deserialize_variant) const + std::function try_deserialize_nested) const { auto & column_variant = assert_cast(column); ReadBufferFromString null_buf(field); @@ -577,25 +577,17 @@ bool SerializationVariant::tryDeserializeImpl( for (size_t global_discr : deserialize_text_order) { ReadBufferFromString variant_buf(field); - /// Usually try_deserialize_variant should not throw any exception, but let's use try/catch just in case. - try + auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); + size_t prev_size = variant_column.size(); + if (try_deserialize_nested(variant_column, variants[global_discr], variant_buf) && variant_buf.eof()) { - auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); - size_t prev_size = variant_column.size(); - if (try_deserialize_variant(variant_column, variants[global_discr], variant_buf) && variant_buf.eof()) - { - column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr)); - column_variant.getOffsets().push_back(prev_size); - return true; - } - else if (variant_column.size() > prev_size) - { - variant_column.popBack(1); - } + column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr)); + column_variant.getOffsets().push_back(prev_size); + return true; } - catch (...) + else if (variant_column.size() > prev_size) { - /// Try next variant. 
+ variant_column.popBack(1); } } diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index b15bc5938be..9ca4b487119 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -224,7 +224,7 @@ public: return std::make_shared(context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if); } - FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} + explicit FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} private: bool use_variant_when_no_common_type = false; From 5497fa79edfa6fdc2559d516486f80f88af40c68 Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 27 Dec 2023 14:11:53 +0000 Subject: [PATCH 040/245] Fix tests --- src/DataTypes/Serializations/SerializationEnum.cpp | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp index fb384547d64..14b1a33e2ce 100644 --- a/src/DataTypes/Serializations/SerializationEnum.cpp +++ b/src/DataTypes/Serializations/SerializationEnum.cpp @@ -73,7 +73,9 @@ template bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { std::string field_name; - readQuotedStringWithSQLStyle(field_name, istr); + if (!tryReadQuotedStringWithSQLStyle(field_name, istr)) + return false; + FieldType x; if (!ref_enum_values.tryGetValue(x, StringRef(field_name))) return false; From 4b2a0b99fc094e6b70e516af0360f126f62a886d Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 27 Dec 2023 20:02:50 +0100 Subject: [PATCH 041/245] Update docs/en/sql-reference/functions/other-functions.md --- docs/en/sql-reference/functions/other-functions.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index d69d692d055..ebc80e4d308 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -2839,7 +2839,7 @@ Extracts a column with specified type from a `Variant` column. **Syntax** ```sql -tupleElement(variant, type_name, [, default_value]) +variantElement(variant, type_name, [, default_value]) ``` **Arguments** From 275fbe3e986c8faee3bd396e3ed87e3707f0f25f Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 27 Dec 2023 20:04:14 +0000 Subject: [PATCH 042/245] Support function to subcolumns optimization for Variant, better text priority for reading Bool --- .../Passes/FunctionToSubcolumnsPass.cpp | 17 +++++++++++++++++ .../Serializations/SerializationVariant.cpp | 4 ++++ .../RewriteFunctionToSubcolumnVisitor.cpp | 15 +++++++++++++++ 3 files changed, 36 insertions(+) diff --git a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp index cd635f87e0e..c74c1038173 100644 --- a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp +++ b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp @@ -176,6 +176,23 @@ public: node = std::make_shared(column, column_source); } + else if (function_name == "variantElement" && isVariant(column_type) && second_argument_constant_node) + { + /// Replace `variantElement(variant_argument, type_name)` with `variant_argument.type_name`. 
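+                /// For example, `variantElement(v, 'UInt64')` becomes a read of the subcolumn `v.UInt64`.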
+                const auto & variant_element_constant_value = second_argument_constant_node->getValue();
+                String subcolumn_name;
+
+                if (variant_element_constant_value.getType() != Field::Types::String)
+                    return;
+
+                subcolumn_name = variant_element_constant_value.get<String>();
+
+                column.name += '.';
+                column.name += subcolumn_name;
+                column.type = function_node->getResultType();
+
+                node = std::make_shared<ColumnNode>(column, column_source);
+            }
             else if (function_name == "mapContains" && column_type.isMap())
             {
                 const auto & data_type_map = assert_cast<const DataTypeMap &>(*column.type);
diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp
index c88dd8e9e0d..49ecb2fc546 100644
--- a/src/DataTypes/Serializations/SerializationVariant.cpp
+++ b/src/DataTypes/Serializations/SerializationVariant.cpp
@@ -534,6 +534,10 @@ std::tuple getTypeTextDeserializePriority(const DataType
         return {max_depth, max_priority, max_simple_nested_depth};
     }
 
+    /// Bool type should have priority higher than all integers.
+    if (isBool(type))
+        return {nested_depth, priority_map[TypeIndex::Int8] + 1 , simple_nested_depth};
+
     return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth};
 }
 
diff --git a/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp b/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp
index 506fa13b7ba..0717abd4782 100644
--- a/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp
+++ b/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp
@@ -122,6 +122,21 @@ void RewriteFunctionToSubcolumnData::visit(ASTFunction & function, ASTPtr & ast)
         ast = transformToSubcolumn(name_in_storage, subcolumn_name);
         ast->setAlias(alias);
     }
+    else if (function.name == "variantElement" && column_type_id == TypeIndex::Variant)
+    {
+        const auto * literal = arguments[1]->as<ASTLiteral>();
+        if (!literal)
+            return;
+
+        String subcolumn_name;
+        auto value_type = literal->value.getType();
+        if (value_type != Field::Types::String)
+            return;
+
+        subcolumn_name = literal->value.get<String>();
+        ast = transformToSubcolumn(name_in_storage, subcolumn_name);
+        ast->setAlias(alias);
+    }
     else
     {
         auto it = binary_function_to_subcolumn.find(function.name);
From 8b4157141c0501d4498278947b468d03638cdf8a Mon Sep 17 00:00:00 2001
From: avogar
Date: Wed, 27 Dec 2023 20:36:10 +0000
Subject: [PATCH 043/245] Fix style

---
 src/DataTypes/Serializations/SerializationVariant.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp
index 49ecb2fc546..9cfc4b9e26f 100644
--- a/src/DataTypes/Serializations/SerializationVariant.cpp
+++ b/src/DataTypes/Serializations/SerializationVariant.cpp
@@ -536,7 +536,7 @@ std::tuple getTypeTextDeserializePriority(const DataType
     /// Bool type should have priority higher than all integers.
if (isBool(type)) - return {nested_depth, priority_map[TypeIndex::Int8] + 1 , simple_nested_depth}; + return {nested_depth, priority_map[TypeIndex::Int8] + 1, simple_nested_depth}; return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; } From 4bb63f0a6f066bca972b5b3754a20f0a56354b8d Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 28 Dec 2023 13:05:15 +0100 Subject: [PATCH 044/245] Update test --- .../02916_broken_projection.reference | 124 ------------------ .../0_stateless/02916_broken_projection.sh | 16 +-- 2 files changed, 8 insertions(+), 132 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 358304de74a..d340326455a 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -2,11 +2,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -21,11 +16,6 @@ check table 1 0 broke metadata of part 'proj' (parent part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -46,11 +36,6 @@ all_2_2_0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -63,11 +48,6 @@ check table broken projections info all_2_2_0 proj FILE_DOESNT_EXIST all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -94,14 +74,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST all_2_2_0 proj_2 NO_FILE_IN_DATA_PART all_3_3_0 proj_2 NO_FILE_IN_DATA_PART -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -131,14 +103,6 @@ all_1_1_0 proj_2 FILE_DOESNT_EXIST all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -155,18 +119,6 @@ check table full (test - all_1_1_0) all_1_1_0 materialize projection proj check table full (test - ) -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_6 1 ['proj','proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_6 1 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_6 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 0 ['proj'] -all_3_5_1_6 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -189,25 +141,6 @@ OPTIMIZE TABLE test FINAL insert new part optimize OPTIMIZE TABLE test FINAL -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_6 0 ['proj','proj_2'] -all_0_0_0_7 0 
['proj','proj_2'] -all_0_8_2_7 1 ['proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_6 0 ['proj','proj_2'] -all_1_1_0_7 0 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_6 0 ['proj','proj_2'] -all_2_2_0_7 0 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 0 ['proj'] -all_3_5_1_6 0 ['proj'] -all_3_5_1_7 0 ['proj','proj_2'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] -all_8_8_0 0 ['proj','proj_2'] -all_9_9_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -224,9 +157,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -235,7 +165,6 @@ used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 -system.parts select from projection 'proj' used projections SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -248,9 +177,6 @@ check table broke data of part 'proj' (parent part: all_0_0_0) check table full (test2 - all_0_0_0) all_0_0_0 -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -262,9 +188,6 @@ check table broke data of part 'all_0_0_0' check table full (test2 - all_0_0_0) all_0_0_0 -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -273,9 +196,6 @@ used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -288,11 +208,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -307,11 +222,6 @@ check table 1 0 broke data of part 'proj' (parent part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj FILE_DOESNT_EXIST select from projection 'proj_2' @@ -325,11 +235,6 @@ broken projections info all_2_2_0 proj NO_FILE_IN_DATA_PART BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -345,11 +250,6 @@ check table broken projections info 0 broke all data of part 'proj' (parent part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj STD_EXCEPTION select from projection 'proj_2' @@ -363,15 +263,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST FILE_DOESNT_EXIST materialize projection proj -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_4 1 ['proj','proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_4 1 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_4 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_3_0_4 1 ['proj','proj_2'] select from 
projection 'proj' 12 16 @@ -388,11 +279,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -407,11 +293,6 @@ check table 1 0 broke all data of part 'proj' (parent part: all_1_1_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj select from projection 'proj_2' 12 @@ -424,11 +305,6 @@ broken projections info all_1_1_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 55e613b8f3a..a1df5dc858d 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings +# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) @@ -149,12 +149,12 @@ function check() expected_error=$3 fi - echo 'system.parts' - $CLICKHOUSE_CLIENT -q " - SELECT name, active, projections - FROM system.parts - WHERE table='$table' AND database=currentDatabase() - ORDER BY name;" + #echo 'system.parts' + #$CLICKHOUSE_CLIENT -q " + #SELECT name, active, projections + #FROM system.parts + #WHERE table='$table' AND database=currentDatabase() + #ORDER BY name;" query_id=$(random 8) @@ -447,7 +447,7 @@ function test3() break_projection test proj all_2_2_0 part - check test proj STD_EXCEPTION + check test broken_projections_info test From 3d2e95dbf5f81185d2a091d5e58490f66ed04bef Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 28 Dec 2023 13:49:49 +0100 Subject: [PATCH 045/245] Fix build --- src/Storages/MergeTree/checkDataPart.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index ea46b6f0d56..5b60f0a7fc2 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -332,7 +332,7 @@ static IMergeTreeDataPart::Checksums checkDataPart( if (throw_on_broken_projection && !broken_projections_message.empty()) { - throw Exception(ErrorCodes::BROKEN_PROJECTION, broken_projections_message.data()); + throw Exception(ErrorCodes::BROKEN_PROJECTION, "{}", broken_projections_message); } if (require_checksums && !projections_on_disk.empty()) From 493f938c455e9bd507d521b7974b1e7a9e7c81b2 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Thu, 28 Dec 2023 17:29:25 +0100 Subject: [PATCH 046/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a1df5dc858d..ca62d275189 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -447,7 +447,7 @@ function test3() break_projection 
test proj all_2_2_0 part - check test + check test proj ErrnoException broken_projections_info test From 91657185c8fc4349cb8825ac2e5d6126fddb8289 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 29 Dec 2023 13:05:15 +0100 Subject: [PATCH 047/245] Fxi --- tests/queries/0_stateless/02916_broken_projection.reference | 2 +- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index d340326455a..beaca49f99c 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -251,7 +251,7 @@ broken projections info 0 broke all data of part 'proj' (parent part: all_2_2_0) select from projection 'proj', expect error: proj -STD_EXCEPTION +Errno select from projection 'proj_2' 12 16 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index ca62d275189..99e54b08b74 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -447,7 +447,7 @@ function test3() break_projection test proj all_2_2_0 part - check test proj ErrnoException + check test proj Errno broken_projections_info test From e0f0100332085f3075951a6d9bf5c8d69f6d9940 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 29 Dec 2023 15:38:15 +0100 Subject: [PATCH 048/245] Update 02916_broken_projection.reference --- tests/queries/0_stateless/02916_broken_projection.reference | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index beaca49f99c..3967215e5de 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -252,6 +252,7 @@ broken projections info broke all data of part 'proj' (parent part: all_2_2_0) select from projection 'proj', expect error: proj Errno +Errno select from projection 'proj_2' 12 16 From 3de5b27c48483962285de0b16f152cc35eadd1a6 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 8 Jan 2024 16:50:17 +0100 Subject: [PATCH 049/245] Fix conflicts --- .../Serializations/SerializationString.cpp | 22 ++++++++++++++++++- 1 file changed, 21 insertions(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationString.cpp b/src/DataTypes/Serializations/SerializationString.cpp index a6bf29336b7..b2c254e63c5 100644 --- a/src/DataTypes/Serializations/SerializationString.cpp +++ b/src/DataTypes/Serializations/SerializationString.cpp @@ -381,7 +381,7 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist str_value = "false"; } - read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); + read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); } else if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') { @@ -406,6 +406,26 @@ bool SerializationString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') return read(column, [&](ColumnString::Chars & data) { return readJSONArrayInto(data, istr); }); + if 
(settings.json.read_bools_as_strings && !istr.eof() && (*istr.position() == 't' || *istr.position() == 'f')) + { + String str_value; + if (*istr.position() == 't') + { + if (!checkString("true", istr)) + return false; + str_value = "true"; + } + else if (*istr.position() == 'f') + { + if (!checkString("false", istr)) + return false; + str_value = "false"; + } + + read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); + return true; + } + if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') { String field; From 21e4b453dfc7df905ed304c5513b50f57ef19228 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 8 Jan 2024 22:02:40 +0100 Subject: [PATCH 050/245] Fix pretty type name --- src/DataTypes/DataTypeVariant.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 5dc42cc7443..2bc4dfa5a7a 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -71,17 +71,17 @@ std::string DataTypeVariant::doGetPrettyName(size_t indent) const { size_t size = variants.size(); WriteBufferFromOwnString s; - s << "Variant(\n"; + s << "Variant("; for (size_t i = 0; i != size; ++i) { if (i != 0) - s << ",\n"; + s << ", "; - s << fourSpaceIndent(indent + 1) << variants[i]->getPrettyName(indent + 1); + s << variants[i]->getPrettyName(indent); } - s << '\n' << fourSpaceIndent(indent) << ')'; + s << ')'; return s.str(); } From 633b4a5dcfcf63bec8e2b5a1b5f38e648348639d Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Tue, 9 Jan 2024 19:23:34 +0100 Subject: [PATCH 051/245] Apply suggestions from code review Co-authored-by: Antonio Andelic --- src/Columns/ColumnNullable.cpp | 2 +- src/Columns/ColumnVariant.cpp | 8 +++++--- src/Columns/ColumnVariant.h | 2 +- src/DataTypes/EnumValues.cpp | 4 +--- 4 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp index d2a579d6800..25b0e35e15e 100644 --- a/src/Columns/ColumnNullable.cpp +++ b/src/Columns/ColumnNullable.cpp @@ -928,7 +928,7 @@ ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column) return assert_cast(*column).cloneNullable(); if (column->canBeInsideNullable()) - return makeNullableSafe(column); + return makeNullable(column); return column; } diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index f90ebfc54bb..10d79f59d37 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -631,9 +631,9 @@ void ColumnVariant::popBack(size_t n) size_t size = local_discriminators_data.size(); const size_t num_variants = variants.size(); std::vector nested_n(num_variants, 0); - for (size_t i = 0; i != n; ++i) + for (size_t i = size - n; i < size; ++i) { - Discriminator discr = local_discriminators_data[size - i - 1]; + Discriminator discr = local_discriminators_data[i]; if (discr != NULL_DISCRIMINATOR) ++nested_n[discr]; } @@ -966,7 +966,7 @@ ColumnPtr ColumnVariant::replicate(const Offsets & replicate_offsets) const { new_offsets_data.reserve(new_size); for (size_t i = old_size; i < new_size; ++i) - new_offsets_data.push_back(new_offsets_data[i - 1] + 1); + new_offsets_data.push_back(i); } else { @@ -1260,6 +1260,8 @@ std::optional ColumnVariant::getLocalDiscriminator { if (variants[i]->size() == local_discriminators->size()) return i; + if 
(!variants[i]->empty()) + return std::nullopt } return std::nullopt; diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index eb96205924c..8f0c5a6eef9 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -205,7 +205,7 @@ public: void compareColumn(const IColumn &, size_t, PaddedPODArray *, PaddedPODArray &, int, int) const override { - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnAggregateFunction"); + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnVariant"); } bool hasEqualValues() const override; diff --git a/src/DataTypes/EnumValues.cpp b/src/DataTypes/EnumValues.cpp index 8a4b1304d5e..a15136b9335 100644 --- a/src/DataTypes/EnumValues.cpp +++ b/src/DataTypes/EnumValues.cpp @@ -85,9 +85,7 @@ bool EnumValues::tryGetValue(T & x, StringRef field_name, bool try_treat_as_i if (try_treat_as_id) { ReadBufferFromMemory tmp_buf(field_name.data, field_name.size); - if (!tryReadText(x, tmp_buf) || !tmp_buf.eof() || !value_to_name_map.contains(x)) - return false; - return true; + return tryReadText(x, tmp_buf) && tmp_buf.eof() && value_to_name_map.contains(x); } return false; } From fb758e48b04c5f799a5169af584f6a562866640d Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 9 Jan 2024 19:02:20 +0000 Subject: [PATCH 052/245] Apply suggestions --- src/Columns/ColumnVariant.cpp | 172 +++++++++++++++------------------- 1 file changed, 74 insertions(+), 98 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index 10d79f59d37..a707ec8e153 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -204,10 +204,13 @@ ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::Mut } } -ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector & local_to_global_discriminators) +namespace +{ + +MutableColumns getVariantsAssumeMutable(const Columns & variants) { MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); + for (const auto & variant : variants) { if (isColumnConst(*variant)) @@ -215,35 +218,24 @@ ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::ve mutable_variants.emplace_back(variant->assumeMutable()); } - return ColumnVariant::create(std::move(mutable_variants), local_to_global_discriminators); + return mutable_variants; +} + +} + +ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector & local_to_global_discriminators) +{ + return ColumnVariant::create(getVariantsAssumeMutable(variants), local_to_global_discriminators); } ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::Columns & variants, const std::vector & local_to_global_discriminators) { - MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); - for (const auto & variant : variants) - { - if (isColumnConst(*variant)) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); - mutable_variants.emplace_back(variant->assumeMutable()); - } - - return ColumnVariant::create(local_discriminators->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); + return ColumnVariant::create(local_discriminators->assumeMutable(), getVariantsAssumeMutable(variants), local_to_global_discriminators); } ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::ColumnPtr & 
offsets, const DB::Columns & variants, const std::vector & local_to_global_discriminators) { - MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); - for (const auto & variant : variants) - { - if (isColumnConst(*variant)) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); - mutable_variants.emplace_back(variant->assumeMutable()); - } - - return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); + return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), getVariantsAssumeMutable(variants), local_to_global_discriminators); } MutableColumnPtr ColumnVariant::cloneEmpty() const @@ -309,104 +301,88 @@ MutableColumnPtr ColumnVariant::cloneResized(size_t new_size) const const auto & local_discriminators_data = getLocalDiscriminators(); const auto & offsets_data = getOffsets(); - /// We can find all variants sizes by scanning all new_size local_discriminators and calculating - /// sizes for all new variants. This code is below and commented. - -// std::vector new_nested_sizes(num_variants, 0); -// for (size_t i = 0; i != new_size; ++i) -// { -// Discriminator discr = local_discriminators_data[i]; -// if (discr != NULL_DISCRIMINATOR) -// ++new_nested_sizes[discr]; -// } -// -// MutableColumns new_variants; -// new_variants.reserve(num_variants); -// for (size_t i = 0; i != num_variants; ++i) -// { -// if (new_nested_sizes[i]) -// new_variants.emplace_back(variants[i]->cloneResized(new_nested_sizes[i])); -// else -// new_variants.emplace_back(variants[i]->cloneEmpty()); -// } -// -// return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); - + /// We can find all variants sizes by scanning all new_size local_discriminators and calculating sizes for all new variants. /// But instead we are trying to optimize it using offsets column: /// For all non-empty variants we are trying to find last occurrence of its discriminator in local_discriminators[:new_size] or - /// first occurrence in local_discriminators[new_size:]. The same row in offsets column will contain the desired size (or size - 1) of variant. + /// first occurrence in local_discriminators[new_size:] depending on what range is smaller. The same row in offsets column will + /// contain the desired size (or size - 1) of variant. /// All empty variants will remain empty. - /// Not sure how good this optimization is, feel free to remove it and use simpler version above. + /// Not sure how good this optimization is, feel free to remove it and use simpler version without using offsets. MutableColumns new_variants(num_variants); - std::unordered_set seen_variants; + std::vector seen_variants(num_variants, 0); + size_t number_of_seen_variants = 0; /// First, check which variants are empty. They will remain empty. for (Discriminator i = 0; i != num_variants; ++i) { if (variants[i]->empty()) { - seen_variants.insert(i); + seen_variants[i] = 1; + ++number_of_seen_variants; new_variants[i] = variants[i]->cloneEmpty(); } } - /// Now, iterate through local discriminators using two pointers. - /// First will go from new_size - 1 to 0, second from new_size to size. - /// Finish when we find all variants or hit lower or upper bound. 
- ssize_t i = new_size - 1; - size_t j = new_size; - while (i != -1 && j != size) + /// Now, choose what range is smaller and use it. + /// [0, new_size) + if (2 * new_size <= size) { - Discriminator i_discr = local_discriminators_data[i]; - if (i_discr != NULL_DISCRIMINATOR) + for (ssize_t i = new_size - 1; i > -1; --i) { - auto [_, inserted] = seen_variants.insert(i_discr); - /// If this is the first occurrence of this discriminator, - /// we can get new size for this variant. - if (inserted) + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) { - new_variants[i_discr] = variants[i_discr]->cloneResized(offsets_data[i] + 1); - if (seen_variants.size() == num_variants) - break; + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (!seen_variants[discr]) + { + seen_variants[discr] = 1; + ++number_of_seen_variants; + new_variants[discr] = variants[discr]->cloneResized(offsets_data[i] + 1); + /// Break if we found sizes for all variants. + if (number_of_seen_variants == num_variants) + break; + } } } - Discriminator j_discr = local_discriminators_data[j]; - if (j_discr != NULL_DISCRIMINATOR) + /// All variants that weren't found in range [0, new_size] will be empty in the result column. + if (number_of_seen_variants != num_variants) { - auto [_, inserted] = seen_variants.insert(j_discr); - /// If this is the first occurrence of this discriminator, - /// we can get new size for this variant. - if (inserted) - { - new_variants[j_discr] = variants[j_discr]->cloneResized(offsets_data[j]); - if (seen_variants.size() == num_variants) - break; - } - } - - --i; - ++j; - } - - /// We can finish in 3 cases: - /// 1) seen_variants.size() == num_variants - we found local_discriminators of all variants, nothing to do. - /// 2) i == -1 - we scanned all values in local_discriminators[:new_size]. Not found variants doesn't have - /// values in local_discriminators[:new_size], so they should be empty in the resized version. - /// 3) j == size - we scanned all values in local_discriminators[new_size:]. Not found variants doesn't have - /// values in local_discriminators[new_size:], so, we should use the full variant in the resized version. - if (seen_variants.size() != num_variants) - { - for (size_t discr = 0; discr != num_variants; ++discr) - { - if (!seen_variants.contains(discr)) - { - if (i == -1) + for (size_t discr = 0; discr != num_variants; ++discr) + if (!seen_variants[discr]) new_variants[discr] = variants[discr]->cloneEmpty(); - else - new_variants[discr] = IColumn::mutate(variants[discr]); + } + } + /// [new_size, size) + else + { + for (size_t i = new_size; i < size; ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (!seen_variants[discr]) + { + seen_variants[discr] = 1; + ++number_of_seen_variants; + new_variants[discr] = variants[discr]->cloneResized(offsets_data[i]); + /// Break if we found sizes for all variants. + if (number_of_seen_variants == num_variants) + break; + } } } + + if (number_of_seen_variants != num_variants) + { + /// All variants that weren't found in range [new_size, size) will not change their sizes. 
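+                /// Such a variant's rows all lie in [0, new_size), so it keeps its full column,
+                /// which is why IColumn::mutate is used here instead of cloneResized.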
+ for (size_t discr = 0; discr != num_variants; ++discr) + if (!seen_variants[discr]) + new_variants[discr] = IColumn::mutate(variants[discr]); + } } return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); @@ -1261,7 +1237,7 @@ std::optional ColumnVariant::getLocalDiscriminator if (variants[i]->size() == local_discriminators->size()) return i; if (!variants[i]->empty()) - return std::nullopt + return std::nullopt; } return std::nullopt; From 10af0d406fb536917a84d23f4bacba073ea9443e Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 10 Jan 2024 16:55:58 +0100 Subject: [PATCH 053/245] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 99e54b08b74..fbd26e59f6f 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage +# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage, no-parallel # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From 1deaaf5466a2633d58fba87521435491546df0a2 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Thu, 11 Jan 2024 15:20:06 +0100 Subject: [PATCH 054/245] Apply suggestions from code review Co-authored-by: Antonio Andelic --- .../Serializations/SerializationDateTime64.cpp | 6 +++--- src/DataTypes/Serializations/SerializationEnum.h | 5 +---- .../Serializations/SerializationNamed.cpp | 1 - .../Serializations/SerializationTuple.cpp | 15 +++------------ 4 files changed, 7 insertions(+), 20 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationDateTime64.cpp b/src/DataTypes/Serializations/SerializationDateTime64.cpp index a19619bf8d3..442e29edd52 100644 --- a/src/DataTypes/Serializations/SerializationDateTime64.cpp +++ b/src/DataTypes/Serializations/SerializationDateTime64.cpp @@ -50,7 +50,7 @@ void SerializationDateTime64::deserializeText(IColumn & column, ReadBuffer & ist bool SerializationDateTime64::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const { DateTime64 result = 0; - if (tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && istr.eof())) + if (!tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && !istr.eof())) return false; assert_cast(column).getData().push_back(result); @@ -151,7 +151,7 @@ bool SerializationDateTime64::tryDeserializeTextQuoted(IColumn & column, ReadBuf DateTime64 x = 0; if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808' { - if (tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) return false; } else /// Just 1504193808 or 01504193808 @@ -265,7 +265,7 @@ bool SerializationDateTime64::tryDeserializeTextCSV(IColumn & column, ReadBuffer { if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic) { - if (tryReadText(x, scale, istr, settings, time_zone, utc_time_zone)) + if (!tryReadText(x, 
scale, istr, settings, time_zone, utc_time_zone)) return false; } else diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 5152a3fbc93..bb720ee9b1f 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -60,10 +60,7 @@ public: bool tryReadValue(ReadBuffer & istr, FieldType & x) const { - if (!tryReadText(x, istr) || !ref_enum_values.hasValue(x)) - return false; - - return true; + return tryReadText(x, istr) && ref_enum_values.hasValue(x); } std::optional> own_enum_values; diff --git a/src/DataTypes/Serializations/SerializationNamed.cpp b/src/DataTypes/Serializations/SerializationNamed.cpp index 1a9cbe9a37d..ca60948ce68 100644 --- a/src/DataTypes/Serializations/SerializationNamed.cpp +++ b/src/DataTypes/Serializations/SerializationNamed.cpp @@ -1,5 +1,4 @@ #include -#include namespace DB { diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index c0b0658e6b4..79b7fa84242 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -212,10 +212,7 @@ ReturnType SerializationTuple::deserializeTextImpl(IColumn & column, ReadBuffer return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } void SerializationTuple::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const @@ -457,10 +454,7 @@ ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuf return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } else { @@ -502,10 +496,7 @@ ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuf return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } } From f05d89bc2b26206b1b6854ad48dd35840b82a123 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 11 Jan 2024 14:48:57 +0000 Subject: [PATCH 055/245] Apply review suggestions --- .../Serializations/ISerialization.cpp | 47 +++--- .../Serializations/SerializationTuple.cpp | 3 + .../Serializations/SerializationVariant.cpp | 135 +++++++++--------- 3 files changed, 101 insertions(+), 84 deletions(-) diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 08575f06f2a..c699b3b0748 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -176,7 +176,7 @@ String getNameForSubstreamPath( stream_name += "." 
+ it->tuple_element_name; } else if (it->type == Substream::VariantDiscriminators) - stream_name += ".discr"; + stream_name += ".variant_discr"; else if (it->type == Substream::VariantOffsets) stream_name += ".variant_offsets"; else if (it->type == Substream::VariantElement) @@ -261,43 +261,51 @@ bool ISerialization::isSpecialCompressionAllowed(const SubstreamPath & path) return true; } -#define TRY_DESERIALIZE_TEXT(deserialize) \ - size_t prev_size = column.size(); \ - try \ - { \ - deserialize(column, istr, settings); \ - return true; \ - } \ - catch (...) \ - { \ - if (column.size() > prev_size) \ - column.popBack(column.size() - prev_size); \ - return false; \ - } \ +namespace +{ + +template +bool tryDeserializeText(const F deserialize, DB::IColumn & column) +{ + size_t prev_size = column.size(); + try + { + deserialize(column); + return true; + } + catch (...) + { + if (column.size() > prev_size) + column.popBack(column.size() - prev_size); + return false; + } +} + +} bool ISerialization::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextCSV) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextCSV(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextEscaped(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextEscaped) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextEscaped(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextJSON) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextJSON(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextQuoted) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextQuoted(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeWholeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeWholeText) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeWholeText(my_column, istr, settings); }, column); } void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -346,7 +354,6 @@ bool ISerialization::hasSubcolumnForPath(const SubstreamPath & path, size_t pref return path[last_elem].type == Substream::NullMap || path[last_elem].type == Substream::TupleElement || path[last_elem].type == Substream::ArraySizes - || path[last_elem].type == Substream::VariantDiscriminators || path[last_elem].type == Substream::VariantElement; } diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index 79b7fa84242..c249ee69e46 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -76,7 +76,10 @@ static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) { auto & element_column = extractElementColumn(column, i); if (element_column.size() > old_size) + { + chassert(old_size - element_column.size() == 1); element_column.popBack(1); + } } }; diff --git 
a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 9cfc4b9e26f..64fcb63d604 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -397,70 +397,76 @@ void SerializationVariant::deserializeBinary(IColumn & column, ReadBuffer & istr namespace { -std::unordered_map getTypesTextDeserializePriorityMap() +const std::unordered_map & getTypesTextDeserializePriorityMap() { - static const std::vector priorities = { - /// Complex types have highest priority. - TypeIndex::Array, - TypeIndex::Tuple, - TypeIndex::Map, - TypeIndex::AggregateFunction, + static std::unordered_map priority_map = [] + { + static constexpr std::array priorities = { + /// Complex types have highest priority. + TypeIndex::Array, + TypeIndex::Tuple, + TypeIndex::Map, + TypeIndex::AggregateFunction, - /// Enums can be parsed both from strings and numbers. - /// So they have high enough priority. - TypeIndex::Enum8, - TypeIndex::Enum16, + /// Enums can be parsed both from strings and numbers. + /// So they have high enough priority. + TypeIndex::Enum8, + TypeIndex::Enum16, - /// Types that can be parsed from strings. - TypeIndex::UUID, - TypeIndex::IPv4, - TypeIndex::IPv6, + /// Types that can be parsed from strings. + TypeIndex::UUID, + TypeIndex::IPv4, + TypeIndex::IPv6, - /// Types that can be parsed from numbers. - /// The order: - /// 1) Integers - /// 2) Big Integers - /// 3) Decimals - /// 4) Floats - /// In each group small types have higher priority. - TypeIndex::Int8, - TypeIndex::UInt8, - TypeIndex::Int16, - TypeIndex::UInt16, - TypeIndex::Int32, - TypeIndex::UInt32, - TypeIndex::Int64, - TypeIndex::UInt64, - TypeIndex::Int128, - TypeIndex::UInt128, - TypeIndex::Int256, - TypeIndex::UInt256, - TypeIndex::Decimal32, - TypeIndex::Decimal64, - TypeIndex::Decimal128, - TypeIndex::Decimal256, - TypeIndex::Float32, - TypeIndex::Float64, + /// Types that can be parsed from numbers. + /// The order: + /// 1) Integers + /// 2) Big Integers + /// 3) Decimals + /// 4) Floats + /// In each group small types have higher priority. + TypeIndex::Int8, + TypeIndex::UInt8, + TypeIndex::Int16, + TypeIndex::UInt16, + TypeIndex::Int32, + TypeIndex::UInt32, + TypeIndex::Int64, + TypeIndex::UInt64, + TypeIndex::Int128, + TypeIndex::UInt128, + TypeIndex::Int256, + TypeIndex::UInt256, + TypeIndex::Decimal32, + TypeIndex::Decimal64, + TypeIndex::Decimal128, + TypeIndex::Decimal256, + TypeIndex::Float32, + TypeIndex::Float64, - /// Dates and DateTimes. More simple Date types have higher priority. - /// They have lower priority as numbers as some DateTimes sometimes can - /// be also parsed from numbers, but we don't want it usually. - TypeIndex::Date, - TypeIndex::Date32, - TypeIndex::DateTime, - TypeIndex::DateTime64, + /// Dates and DateTimes. More simple Date types have higher priority. + /// They have lower priority as numbers as some DateTimes sometimes can + /// be also parsed from numbers, but we don't want it usually. + TypeIndex::Date, + TypeIndex::Date32, + TypeIndex::DateTime, + TypeIndex::DateTime64, - /// String types have almost the lowest priority, - /// as in text formats almost all data can - /// be deserialized into String type. - TypeIndex::FixedString, - TypeIndex::String, - }; + /// String types have almost the lowest priority, + /// as in text formats almost all data can + /// be deserialized into String type. 
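+            /// For example, the input "42" is claimed by the numeric variants above,
+            /// while arbitrary text usually falls through to the String variants here.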
+ TypeIndex::FixedString, + TypeIndex::String, + }; + + std::unordered_map pm; + + pm.reserve(priorities.size()); + for (size_t i = 0; i != priorities.size(); ++i) + pm[priorities[i]] = priorities.size() - i; + return pm; + }(); - std::unordered_map priority_map; - priority_map.reserve(priorities.size()); - for (size_t i = 0; i != priorities.size(); ++i) - priority_map[priorities[i]] = priorities.size() - i; return priority_map; } @@ -476,7 +482,7 @@ std::unordered_map getTypesTextDeserializePriorityMap() /// so if we have types with the same level of nesting and the same priority, we will first try to deserialize LowCardinality/Nullable types /// (for example if we have types Array(Array(String)) and Array(Array(Nullable(String))). /// This is just a batch of heuristics. -std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map & priority_map) +std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, const std::unordered_map & priority_map) { if (const auto * nullable_type = typeid_cast(type.get())) return getTypeTextDeserializePriority(nullable_type->getNestedType(), nested_depth, simple_nested_depth + 1, priority_map); @@ -487,7 +493,7 @@ std::tuple getTypeTextDeserializePriority(const DataType if (const auto * array_type = typeid_cast(type.get())) { auto [elements_nested_depth, elements_priority, elements_simple_nested_depth] = getTypeTextDeserializePriority(array_type->getNestedType(), nested_depth + 1, simple_nested_depth, priority_map); - return {elements_nested_depth, elements_priority + priority_map[TypeIndex::Array], elements_simple_nested_depth}; + return {elements_nested_depth, elements_priority + priority_map.at(TypeIndex::Array), elements_simple_nested_depth}; } if (const auto * tuple_type = typeid_cast(type.get())) @@ -505,14 +511,14 @@ std::tuple getTypeTextDeserializePriority(const DataType max_simple_nested_depth = elem_simple_nested_depth; } - return {max_nested_depth, sum_priority + priority_map[TypeIndex::Tuple], max_simple_nested_depth}; + return {max_nested_depth, sum_priority + priority_map.at(TypeIndex::Tuple), max_simple_nested_depth}; } if (const auto * map_type = typeid_cast(type.get())) { auto [key_max_depth, key_priority, key_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getKeyType(), nested_depth + 1, simple_nested_depth, priority_map); auto [value_max_depth, value_priority, value_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getValueType(), nested_depth + 1, simple_nested_depth, priority_map); - return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map[TypeIndex::Map], std::max(key_simple_nested_depth, value_simple_nested_depth)}; + return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map.at(TypeIndex::Map), std::max(key_simple_nested_depth, value_simple_nested_depth)}; } if (const auto * variant_type = typeid_cast(type.get())) @@ -536,9 +542,10 @@ std::tuple getTypeTextDeserializePriority(const DataType /// Bool type should have priority higher then all integers. 
if (isBool(type)) - return {nested_depth, priority_map[TypeIndex::Int8] + 1, simple_nested_depth}; + return {nested_depth, priority_map.at(TypeIndex::Int8) + 1, simple_nested_depth}; - return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; + auto it = priority_map.find(type->getTypeId()); + return {nested_depth, it == priority_map.end() ? 0 : it->second, simple_nested_depth}; } } @@ -549,7 +556,7 @@ std::vector SerializationVariant::getVariantsDeserializeTextOrder(const priorities.reserve(variant_types.size()); std::vector order; order.reserve(variant_types.size()); - auto priority_map = getTypesTextDeserializePriorityMap(); + const auto & priority_map = getTypesTextDeserializePriorityMap(); for (size_t i = 0; i != variant_types.size(); ++i) { priorities.push_back(getTypeTextDeserializePriority(variant_types[i], 0, 0, priority_map)); From 9e639df12e69c7373e400115977c432b8fdf31f2 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 11 Jan 2024 18:44:05 +0000 Subject: [PATCH 056/245] Add fixes, add new mode to getLeastSupertype and use it in if/multiIf --- .../Serializations/SerializationTuple.cpp | 2 +- src/DataTypes/getLeastSupertype.cpp | 73 ++++++++++++++++--- src/DataTypes/getLeastSupertype.h | 12 +++ src/Functions/if.cpp | 14 +--- src/Functions/multiIf.cpp | 8 +- ...940_variant_text_deserialization.reference | 2 +- 6 files changed, 79 insertions(+), 32 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index c249ee69e46..5d8c84b70bf 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -77,7 +77,7 @@ static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) auto & element_column = extractElementColumn(column, i); if (element_column.size() > old_size) { - chassert(old_size - element_column.size() == 1); + chassert(element_column.size() - old_size == 1); element_column.popBack(1); } } diff --git a/src/DataTypes/getLeastSupertype.cpp b/src/DataTypes/getLeastSupertype.cpp index e5bdb4b267f..5d67f888c4b 100644 --- a/src/DataTypes/getLeastSupertype.cpp +++ b/src/DataTypes/getLeastSupertype.cpp @@ -18,6 +18,7 @@ #include #include #include +#include namespace DB @@ -58,6 +59,25 @@ DataTypePtr throwOrReturn(const DataTypes & types, std::string_view message_suff if constexpr (on_error == LeastSupertypeOnError::String) return std::make_shared(); + if constexpr (on_error == LeastSupertypeOnError::Variant && std::is_same_v>) + { + DataTypes variants; + for (const auto & type : types) + { + if (isVariant(type)) + { + const DataTypes & nested_variants = assert_cast(*type).getVariants(); + variants.insert(variants.end(), nested_variants.begin(), nested_variants.end()); + } + else + { + variants.push_back(removeNullableOrLowCardinalityNullable(type)); + } + } + + return std::make_shared(variants); + } + if constexpr (on_error == LeastSupertypeOnError::Null) return nullptr; @@ -67,8 +87,8 @@ DataTypePtr throwOrReturn(const DataTypes & types, std::string_view message_suff throw Exception(error_code, "There is no supertype for types {} {}", getExceptionMessagePrefix(types), message_suffix); } -template -DataTypePtr getNumericType(const TypeIndexSet & types) +template +DataTypePtr getNumericType(const TypeIndexSet & types, ThrowOrReturnFunc throwOrReturnFunc) { bool all_numbers = true; @@ -119,7 +139,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) if (max_bits_of_signed_integer || 
max_bits_of_unsigned_integer || max_mantissa_bits_of_floating) { if (!all_numbers) - return throwOrReturn(types, "because some of them are numbers and some of them are not", ErrorCodes::NO_COMMON_TYPE); + return throwOrReturnFunc(types, "because some of them are numbers and some of them are not", ErrorCodes::NO_COMMON_TYPE); /// If there are signed and unsigned types of same bit-width, the result must be signed number with at least one more bit. /// Example, common of Int32, UInt32 = Int64. @@ -134,7 +154,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) if (min_bit_width_of_integer != 64) ++min_bit_width_of_integer; else - return throwOrReturn(types, + return throwOrReturnFunc(types, "because some of them are signed integers and some are unsigned integers," " but there is no signed integer type, that can exactly represent all required unsigned integer values", ErrorCodes::NO_COMMON_TYPE); @@ -149,7 +169,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_mantissa_bits <= 53) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " because some of them are integers and some are floating point," " but there is no floating point type, that can exactly represent all required integers", ErrorCodes::NO_COMMON_TYPE); } @@ -170,7 +190,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_bit_width_of_integer <= 256) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " because some of them are signed integers and some are unsigned integers," " but there is no signed integer type, that can exactly represent all required unsigned integer values", ErrorCodes::NO_COMMON_TYPE); } @@ -190,7 +210,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_bit_width_of_integer <= 256) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " but as all data types are unsigned integers, we must have found maximum unsigned integer type", ErrorCodes::NO_COMMON_TYPE); } } @@ -382,7 +402,18 @@ DataTypePtr getLeastSupertype(const DataTypes & types) if (!all_maps) return throwOrReturn(types, "because some of them are Maps and some of them are not", ErrorCodes::NO_COMMON_TYPE); - auto keys_common_type = getLeastSupertype(key_types); + DataTypePtr keys_common_type; + if constexpr (on_error == LeastSupertypeOnError::Variant) + { + keys_common_type = getLeastSupertype(key_types); + if (!keys_common_type) + return throwOrReturn(types, "", ErrorCodes::NO_COMMON_TYPE); + } + else + { + keys_common_type = getLeastSupertype(key_types); + } + auto values_common_type = getLeastSupertype(value_types); /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype for keys or values, /// keys_common_type or values_common_type will be nullptr, we should return nullptr in this case. @@ -423,7 +454,18 @@ DataTypePtr getLeastSupertype(const DataTypes & types) return getLeastSupertype(nested_types); else { - auto nested_type = getLeastSupertype(nested_types); + DataTypePtr nested_type; + if constexpr (on_error == LeastSupertypeOnError::Variant) + { + nested_type = getLeastSupertype(nested_types); + if (!nested_type) + return throwOrReturn(types, "", ErrorCodes::NO_COMMON_TYPE); + } + else + { + nested_type = getLeastSupertype(nested_types); + } + /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype, /// nested_type will be nullptr, we should return nullptr in this case. 
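+        /// e.g. in Variant mode, Array(UInt64) and Array(String) produce
+        /// Array(Variant(UInt64, String)) (see the examples in getLeastSupertype.h).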
if (!nested_type) @@ -456,6 +498,8 @@ DataTypePtr getLeastSupertype(const DataTypes & types) if (have_nullable) { auto nested_type = getLeastSupertype(nested_types); + if (isVariant(nested_type)) + return nested_type; /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype, /// nested_type will be nullptr, we should return nullptr in this case. if (!nested_type) @@ -623,7 +667,8 @@ DataTypePtr getLeastSupertype(const DataTypes & types) { /// First, if we have signed integers, try to convert all UInt64 to Int64 if possible. convertUInt64toInt64IfPossible(types, type_ids); - auto numeric_type = getNumericType(type_ids); + auto throw_or_return = [&](const TypeIndexSet &, std::string_view message_suffix, int error_code){ return throwOrReturn(types, message_suffix, error_code); }; + auto numeric_type = getNumericType(type_ids, throw_or_return); if (numeric_type) return numeric_type; } @@ -637,6 +682,11 @@ DataTypePtr getLeastSupertypeOrString(const DataTypes & types) return getLeastSupertype(types); } +DataTypePtr getLeastSupertypeOrVariant(const DataTypes & types) +{ + return getLeastSupertype(types); +} + DataTypePtr tryGetLeastSupertype(const DataTypes & types) { return getLeastSupertype(types); @@ -676,7 +726,8 @@ DataTypePtr getLeastSupertype(const TypeIndexSet & types) return std::make_shared(); } - auto numeric_type = getNumericType(types); + auto throw_or_return = [](const TypeIndexSet & type_ids, std::string_view message_suffix, int error_code){ return throwOrReturn(type_ids, message_suffix, error_code); }; + auto numeric_type = getNumericType(types, throw_or_return); if (numeric_type) return numeric_type; diff --git a/src/DataTypes/getLeastSupertype.h b/src/DataTypes/getLeastSupertype.h index 2ef4a0e6850..d949fad69c5 100644 --- a/src/DataTypes/getLeastSupertype.h +++ b/src/DataTypes/getLeastSupertype.h @@ -8,6 +8,7 @@ enum class LeastSupertypeOnError { Throw, String, + Variant, Null, }; @@ -24,6 +25,17 @@ DataTypePtr getLeastSupertype(const DataTypes & types); /// All types can be casted to String, because they can be serialized to String. DataTypePtr getLeastSupertypeOrString(const DataTypes & types); +/// Same as getLeastSupertype but in case when there is no supertype for some types +/// it uses Variant of these types as a supertype. Any type can be casted to a Variant +/// that contains this type. +/// As nested Variants are not allowed, if one of the types is Variant, it's variants +/// are used in the resulting Variant. +/// Examples: +/// (UInt64, String) -> Variant(UInt64, String) +/// (Array(UInt64), Array(String)) -> Array(Variant(UInt64, String)) +/// (Variant(UInt64, String), Array(UInt32)) -> Variant(UInt64, String, Array(UInt32)) +DataTypePtr getLeastSupertypeOrVariant(const DataTypes & types); + /// Same as above but return nullptr instead of throwing exception. 
DataTypePtr tryGetLeastSupertype(const DataTypes & types); diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index 1dc7443f124..c247938f885 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -688,15 +688,9 @@ private: DataTypePtr common_type; if (use_variant_when_no_common_type) - { - common_type = tryGetLeastSupertype(DataTypes{arg1.type, arg2.type}); - if (!common_type) - common_type = std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arg1.type), removeNullableOrLowCardinalityNullable(arg2.type)}); - } + common_type = getLeastSupertypeOrVariant(DataTypes{arg1.type, arg2.type}); else - { common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); - } ColumnPtr col_then = castColumn(arg1, common_type); ColumnPtr col_else = castColumn(arg2, common_type); @@ -1118,11 +1112,7 @@ public: "Must be UInt8.", arguments[0]->getName()); if (use_variant_when_no_common_type) - { - if (auto res = tryGetLeastSupertype(DataTypes{arguments[1], arguments[2]})) - return res; - return std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arguments[1]), removeNullableOrLowCardinalityNullable(arguments[2])}); - } + return getLeastSupertypeOrVariant(DataTypes{arguments[1], arguments[2]}); return getLeastSupertype(DataTypes{arguments[1], arguments[2]}); } diff --git a/src/Functions/multiIf.cpp b/src/Functions/multiIf.cpp index 7a2e9444b2c..cefbea9f352 100644 --- a/src/Functions/multiIf.cpp +++ b/src/Functions/multiIf.cpp @@ -119,13 +119,7 @@ public: }); if (context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if) - { - if (auto res = tryGetLeastSupertype(types_of_branches)) - return res; - for (auto & type : types_of_branches) - type = removeNullableOrLowCardinalityNullable(type); - return std::make_shared(types_of_branches); - } + return getLeastSupertypeOrVariant(types_of_branches); return getLeastSupertype(types_of_branches); } diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.reference b/tests/queries/0_stateless/02940_variant_text_deserialization.reference index 98725917567..8836e6c4e57 100644 --- a/tests/queries/0_stateless/02940_variant_text_deserialization.reference +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.reference @@ -505,7 +505,7 @@ String (NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0)(NULL,NULL),('string',NULL),(-1,NULL),(0,0)Floats (NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Decimals (NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Dates and DateTimes -(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01 
00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000','1970-01-01 00:00:00.000'),('2020-01-01 00:00:00.999',NULL),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID +(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01 00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01 00:00:00.999','2020-01-01 00:00:00.999'),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID (NULL,NULL),('string',NULL),('c8619cca-0caa-445e-ae76-1d4f6e0b3927','c8619cca-0caa-445e-ae76-1d4f6e0b3927'),('c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA',NULL)IPv4 (NULL,NULL),('string',NULL),('127.0.0.1','127.0.0.1'),('127.0.0.1AAA',NULL)IPv6 (NULL,NULL),('string',NULL),('2001:db8:85a3::8a2e:370:7334','2001:db8:85a3::8a2e:370:7334'),('2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA',NULL)Enum From 3eba7678057df92e8a7f91912863843d377eecd4 Mon Sep 17 00:00:00 2001 From: yariks5s Date: Mon, 15 Jan 2024 19:17:13 +0000 Subject: [PATCH 057/245] init --- src/Interpreters/InterpreterCreateQuery.cpp | 10 ++++++++-- .../02973_dictionary_table_exception_fix.reference | 0 .../02973_dictionary_table_exception_fix.sql | 6 ++++++ 3 files changed, 14 insertions(+), 2 deletions(-) create mode 100644 tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference create mode 100644 tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 36e864ace26..c00f58de59a 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -1405,8 +1405,14 @@ bool InterpreterCreateQuery::doCreateTable(ASTCreateQuery & create, interpreter.execute(); } else - throw Exception(storage_already_exists_error_code, - "{} {}.{} already exists", storage_name, backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + { + if (database->getTable(create.getTable(), getContext())->isDictionary()) + throw Exception(ErrorCodes::DICTIONARY_ALREADY_EXISTS, + "Dictionary {}.{} already exists", backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + else + throw Exception(ErrorCodes::TABLE_ALREADY_EXISTS, + "Table {}.{} already exists", backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + } } else if (!create.attach) { diff --git a/tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql new file mode 100644 index 00000000000..f8061b42670 --- /dev/null +++ b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql @@ -0,0 +1,6 @@ +CREATE TABLE test_table (i Int64) engine=MergeTree order by i; +CREATE DICTIONARY test_dict (y String, value UInt64 DEFAULT 0) PRIMARY KEY y SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); +CREATE TABLE test_dict (y Int64) engine=MergeTree order by y; -- { serverError DICTIONARY_ALREADY_EXISTS } +CREATE DICTIONARY test_table (y String, value UInt64 DEFAULT 0) PRIMARY KEY y 
SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); -- { serverError TABLE_ALREADY_EXISTS }
+CREATE DICTIONARY test_dict (y String, value UInt64 DEFAULT 0) PRIMARY KEY y SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); -- { serverError DICTIONARY_ALREADY_EXISTS }
+CREATE TABLE test_table (y Int64) engine=MergeTree order by y; -- { serverError TABLE_ALREADY_EXISTS }

From 7bc6a858c7778911a51e4c2430125f9c3741a535 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Tue, 16 Jan 2024 19:44:55 +0100
Subject: [PATCH 058/245] Rewrite bash test to integration test

---
 .../test_broken_projections/__init__.py       |   0
 .../config.d/backups.xml                      |  13 +
 .../test_broken_projections/test.py           | 492 +++++++++++++++++
 .../02916_broken_projection.reference         | 322 -----------
 .../0_stateless/02916_broken_projection.sh    | 515 ------------------
 5 files changed, 505 insertions(+), 837 deletions(-)
 create mode 100644 tests/integration/test_broken_projections/__init__.py
 create mode 100644 tests/integration/test_broken_projections/config.d/backups.xml
 create mode 100644 tests/integration/test_broken_projections/test.py
 delete mode 100644 tests/queries/0_stateless/02916_broken_projection.reference
 delete mode 100755 tests/queries/0_stateless/02916_broken_projection.sh

diff --git a/tests/integration/test_broken_projections/__init__.py b/tests/integration/test_broken_projections/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/tests/integration/test_broken_projections/config.d/backups.xml b/tests/integration/test_broken_projections/config.d/backups.xml
new file mode 100644
index 00000000000..4da8edffd67
--- /dev/null
+++ b/tests/integration/test_broken_projections/config.d/backups.xml
@@ -0,0 +1,13 @@
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <backups>
+                <type>local</type>
+                <path>/var/lib/clickhouse/disks/backups/</path>
+            </backups>
+        </disks>
+    </storage_configuration>
+    <backups>
+        <allowed_disk>backups</allowed_disk>
+    </backups>
+</clickhouse>
diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
new file mode 100644
index 00000000000..ca1a29817a5
--- /dev/null
+++ b/tests/integration/test_broken_projections/test.py
@@ -0,0 +1,492 @@
+import time
+import pytest
+import logging
+import string
+import random
+from helpers.cluster import ClickHouseCluster
+
+cluster = ClickHouseCluster(__file__)
+
+
+@pytest.fixture(scope="module")
+def cluster():
+    try:
+        cluster = ClickHouseCluster(__file__)
+        cluster.add_instance(
+            "node",
+            main_configs=["config.d/backups.xml"],
+            stay_alive=True,
+            with_zookeeper=True,
+        )
+
+        logging.info("Starting cluster...")
+        cluster.start()
+        logging.info("Cluster started")
+
+        yield cluster
+    finally:
+        cluster.shutdown()
+
+
+def create_table(node, table, replica, data_prefix = ""):
+    if data_prefix == "":
+        data_prefix = table
+
+    node.query(
+        f"""
+        DROP TABLE IF EXISTS {table} SYNC;
+        CREATE TABLE {table}
+        (
+            a String,
+            b String,
+            c Int64,
+            d Int64,
+            e Int64,
+
+            PROJECTION proj
+            (
+                SELECT c ORDER BY d
+            ),
+            PROJECTION proj_2
+            (
+                SELECT d ORDER BY c
+            )
+        )
+        ENGINE = ReplicatedMergeTree('/test_broken_projection_{data_prefix}/data/', '{replica}') ORDER BY a
+        SETTINGS min_bytes_for_wide_part = 0,
+            max_parts_to_merge_at_once=3,
+            enable_vertical_merge_algorithm=1,
+            vertical_merge_algorithm_min_rows_to_activate = 1,
+            vertical_merge_algorithm_min_columns_to_activate = 1,
+            vertical_merge_algorithm_min_columns_to_activate = 1,
+            compress_primary_key=0;
+        """
+    )
+
+
+def insert(node, table, offset, size):
+    node.query(
+        f"""
+        INSERT INTO {table}
+        SELECT number, number, number, number, number%2 FROM numbers({offset}, {size})
+        SETTINGS 
insert_keeper_fault_injection_probability=0.0;
+        """
+    )
+
+
+def get_parts(node, table):
+    return (
+        node.query(
+            f"""
+            SELECT name
+            FROM system.parts
+            WHERE table='{table}' AND database=currentDatabase() AND active = 1
+            ORDER BY name;
+            """
+        )
+        .strip()
+        .split("\n")
+    )
+
+
+def bash(node, command):
+    node.exec_in_container(["bash", "-c", command], privileged=True, user="root")
+
+
+def break_projection(node, table, part, parent_part, break_type):
+    part_path = node.query(
+        f"""
+        SELECT path
+        FROM system.projection_parts
+        WHERE table='{table}'
+        AND database=currentDatabase()
+        AND active=1
+        AND part_name='{part}'
+        AND parent_name='{parent_part}'
+        ORDER BY modification_time DESC
+        LIMIT 1;
+        """
+    ).strip()
+
+    node.query(
+        f"select throwIf(substring('{part_path}', 1, 1) != '/', 'Path is relative: {part_path}')"
+    )
+
+    if break_type == "data":
+        bash(node, f"rm '{part_path}/d.bin'")
+        bash(node, f"rm '{part_path}/c.bin'")
+    elif break_type == "metadata":
+        bash(node, f"rm '{part_path}/columns.txt'")
+    elif break_type == "part":
+        bash(node, f"rm -r '{part_path}'")
+
+
+def break_part(node, table, part):
+    part_path = node.query(
+        f"""
+        SELECT path
+        FROM system.parts
+        WHERE table='{table}'
+        AND database=currentDatabase()
+        AND active=1
+        AND part_name='{part}'
+        ORDER BY modification_time DESC
+        LIMIT 1;
+        """
+    ).strip()
+
+    node.query(
+        f"select throwIf(substring('{part_path}', 1, 1) != '/', 'Path is relative: {part_path}')"
+    )
+    bash(node, f"rm '{part_path}/columns.txt'")
+
+
+def get_broken_projections_info(node, table):
+    return node.query(
+        f"""
+        SELECT parent_name, name, errors.name FROM
+        (
+            SELECT parent_name, name, exception_code
+            FROM system.projection_parts
+            WHERE table='{table}'
+            AND database=currentDatabase()
+            AND is_broken = 1
+        ) AS parts_info
+        INNER JOIN system.errors AS errors
+        ON parts_info.exception_code = errors.code
+        ORDER BY parent_name, name
+        """
+    ).strip()
+
+
+def optimize(node, table, final, no_wait):
+    query = f"OPTIMIZE TABLE {table}"
+    if final:
+        query += " FINAL"
+    if no_wait:
+        query += " SETTINGS alter_sync=0"
+    node.query(query)
+
+
+def reattach(node, table):
+    node.query(
+        f"""
+        DETACH TABLE {table};
+        ATTACH TABLE {table};
+        """
+    )
+
+
+def materialize_projection(node, table, proj):
+    node.query(
+        f"ALTER TABLE {table} MATERIALIZE PROJECTION {proj} SETTINGS mutations_sync=2"
+    )
+
+
+def check_table_full(node, table):
+    return node.query(
+        f"CHECK TABLE {table} SETTINGS check_query_single_value_result = 0;"
+    ).strip()
+
+
+def random_str(length=6):
+    alphabet = string.ascii_lowercase + string.digits
+    return "".join(random.SystemRandom().choice(alphabet) for _ in range(length))
+
+
+def check(node, table, check_result, expect_broken_part="", expected_error=""):
+    query_id = random_str()
+
+    if expect_broken_part == "proj":
+        assert expected_error in node.query_and_get_error(
+            f"SELECT c FROM '{table}' WHERE d == 12 ORDER BY c"
+        )
+    else:
+        node.query(
+            f"SELECT c FROM '{table}' WHERE d == 12 OR d == 16 ORDER BY c",
+            query_id=query_id,
+        )
+        assert "proj" in node.query(
+            f"""
+            SYSTEM FLUSH LOGS;
+            SELECT query, splitByChar('.', arrayJoin(projections))[-1]
+            FROM system.query_log
+            WHERE current_database=currentDatabase() AND query_id='{query_id}' AND type='QueryFinish'
+            """
+        )
+
+    query_id = random_str()
+
+    if expect_broken_part == "proj_2":
+        assert expected_error in node.query_and_get_error(
+            f"SELECT d FROM '{table}' WHERE c == 12 ORDER BY d"
+        )
+    else:
+        node.query(
+            f"SELECT d FROM '{table}' 
WHERE c == 12 OR c == 16 ORDER BY d",
+            query_id=query_id,
+        )
+        assert "proj" in node.query(
+            f"""
+            SYSTEM FLUSH LOGS;
+            SELECT query, splitByChar('.', arrayJoin(projections))[-1]
+            FROM system.query_log
+            WHERE current_database=currentDatabase() AND query_id='{query_id}' AND type='QueryFinish'
+            """
+        )
+
+    assert check_result == int(node.query(f"CHECK TABLE {table}"))
+
+
+def test_broken_ignored(cluster):
+    node = cluster.instances["node"]
+
+    table_name = "test1"
+    create_table(node, table_name, 1)
+
+    insert(node, table_name, 0, 5)
+    insert(node, table_name, 5, 5)
+    insert(node, table_name, 10, 5)
+    insert(node, table_name, 15, 5)
+
+    assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts(
+        node, table_name
+    )
+
+    # Break the metadata (columns.txt) file of projection 'proj'.
+    break_projection(node, table_name, "proj", "all_2_2_0", "metadata")
+
+    # Run a select and then a "check table" query.
+    # The select works because it does not read columns.txt,
+    # but we expect the check table result to be 0.
+    check(node, table_name, 0)
+
+    # Projection 'proj' from part all_2_2_0 will now appear in broken parts info
+    # because it was marked broken during the "check table" query.
+    assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" in get_broken_projections_info(
+        node, table_name
+    )
+
+    # The check table query will also show a list of parts which have broken projections.
+    assert "all_2_2_0" in check_table_full(node, table_name)
+
+    # Break the data file of projection 'proj_2' for part all_2_2_0.
+    break_projection(node, table_name, "proj_2", "all_2_2_0", "data")
+
+    # It will not yet appear in broken projections info.
+    assert "proj_2" not in get_broken_projections_info(node, table_name)
+
+    # The select now fails with the error "File doesn't exist".
+    check(node, table_name, 0, "proj_2", "FILE_DOESNT_EXIST")
+
+    # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info.
+    assert "all_2_2_0\tproj_2\tNO_FILE_IN_DATA_PART" in get_broken_projections_info(
+        node, table_name
+    )
+
+    # A second select works, because the projection is now marked as broken.
+    check(node, table_name, 0)
+
+    # Break the data file of projection 'proj_2' for part all_3_3_0.
+    break_projection(node, table_name, "proj_2", "all_3_3_0", "data")
+
+    # It will not yet appear in broken projections info.
+    assert "all_3_3_0" not in get_broken_projections_info(node, table_name)
+
+    insert(node, table_name, 20, 5)
+    insert(node, table_name, 25, 5)
+
+    # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and the server does NOT know it yet.
+    # Parts all_4_4_0 and all_5_5_0 both have non-broken projections.
+    # So a merge will be created for the future part all_3_5_1.
+    # During the merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken.
+    # The merge will be retried and on the second attempt it will succeed.
+    # The result part all_3_5_1 will have only 1 projection - 'proj', because
+    # it will skip 'proj_2' once it sees that one part no longer has it in the set of valid projections.
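+    # optimize() below is called with final=0 and no_wait=1, i.e. it runs
+    # "OPTIMIZE TABLE ... SETTINGS alter_sync=0" and returns without waiting;
+    # the sleep afterwards gives the background merge time to fail on the
+    # broken 'proj_2', retry and succeed.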
+ optimize(node, table_name, 0, 1) + time.sleep(5) + + # table_uuid=node.query(f"SELECT uuid FROM system.tables WHERE table='{table_name}' and database=currentDatabase()").strip() + # assert 0 < int( + # node.query( + # f""" + # SYSTEM FLUSH LOGS; + # SELECT count() FROM system.text_log + # WHERE level='Error' + # AND logger_name='MergeTreeBackgroundExecutor' + # AND message like 'Exception while executing background task %{table_uuid}:all_3_5_1%%Cannot open file%proj_2.proj/c.bin%' + # """) + # ) + + assert "all_3_3_0" in get_broken_projections_info(node, table_name) + check(node, table_name, 0) + + +def test_materialize_broken_projection(cluster): + node = cluster.instances["node"] + + table_name = "test2" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts( + node, table_name + ) + + break_projection(node, table_name, "proj", "all_1_1_0", "metadata") + reattach(node, table_name) + + assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" in get_broken_projections_info( + node, table_name + ) + assert "Part all_1_1_0 has a broken projection proj" in check_table_full( + node, table_name + ) + + break_projection(node, table_name, "proj_2", "all_1_1_0", "data") + reattach(node, table_name) + + assert "all_1_1_0\tproj_2\tFILE_DOESNT_EXIST" in get_broken_projections_info( + node, table_name + ) + assert "Part all_1_1_0 has a broken projection proj_2" in check_table_full( + node, table_name + ) + + materialize_projection(node, table_name, "proj") + + assert "has a broken projection" not in check_table_full(node, table_name) + + +def test_broken_ignored_replicated(cluster): + node = cluster.instances["node"] + + table_name = "test3" + table_name2 = "test3_replica" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + check(node, table_name, 1) + + create_table(node, table_name2, 2, table_name) + check(node, table_name2, 1) + + break_projection(node, table_name, "proj", "all_0_0_0", "data") + assert "Part all_0_0_0 has a broken projection proj" in check_table_full( + node, table_name + ) + + break_part(node, table_name, "all_0_0_0") + node.query(f"SYSTEM SYNC REPLICA {table_name}") + assert "has a broken projection" not in check_table_full(node, table_name) + + +def test_broken_projections_in_backups(cluster): + node = cluster.instances["node"] + + table_name = "test4" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + check(node, table_name, 1) + + break_projection(node, table_name, "proj", "all_2_2_0", "data") + check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST") + + assert "all_2_2_0\tproj\tNO_FILE_IN_DATA_PART" in get_broken_projections_info( + node, table_name + ) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b1') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b1'); + """ + ) + + check(node, table_name, 1) + + assert "" == get_broken_projections_info(node, 
table_name) + # TODO: add a check for what projections are loaded + + break_projection(node, table_name, "proj", "all_2_2_0", "part") + + check(node, table_name, 0, "proj", "ErrnoException") + + assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + node, table_name + ) + + assert "FILE_DOESNT_EXIST" in node.query_and_get_error( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b2') + """ + ) + + materialize_projection(node, table_name, "proj") + check(node, table_name, 1) + # TODO: + # assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info(node, table_name) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b3') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b3'); + """ + ) + check(node, table_name, 1) + + break_projection(node, table_name, "proj", "all_1_1_0", "part") + # TODO: check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST") + assert "Part all_1_1_0 has a broken projection proj" in check_table_full( + node, table_name + ) + assert "all_1_1_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + node, table_name + ) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b4'); + """ + ) + check(node, table_name, 1) + assert "" == get_broken_projections_info(node, table_name) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference deleted file mode 100644 index 3967215e5de..00000000000 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ /dev/null @@ -1,322 +0,0 @@ -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke metadata of part 'proj' (parent part: all_2_2_0) -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -check table full (test - all_2_2_0) -all_2_2_0 -0 -broke data of part 'proj_2' (parent part: all_2_2_0) -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: proj_2 -FILE_DOESNT_EXIST -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from 
projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -0 -broke data of part 'proj_2' (parent part: all_3_3_0) -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -insert new part -insert new part -optimize -OPTIMIZE TABLE test SETTINGS alter_sync=0 -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -all_3_3_0 proj_2 NO_FILE_IN_DATA_PART -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -0 -broke metadata of part 'proj' (parent part: all_1_1_0) -Detach - Attach -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj_2 FILE_DOESNT_EXIST -all_3_3_0 proj_2 FILE_DOESNT_EXIST -0 -broke data of part 'proj_2' (parent part: all_1_1_0) -Detach - Attach -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART -all_1_1_0 proj_2 FILE_DOESNT_EXIST -all_2_2_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj_2 FILE_DOESNT_EXIST -all_3_3_0 proj_2 FILE_DOESNT_EXIST -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -check table full (test - all_1_1_0) -all_1_1_0 -materialize projection proj -check table full (test - ) -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -materialize projection proj_2 -check table full (test - ) -0 -broke data of part 'proj' (parent part: all_3_5_1_7) -insert new part -optimize -OPTIMIZE TABLE test FINAL -insert new part -optimize -OPTIMIZE TABLE test FINAL -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -select from projection 'proj' -used projections -SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke data of part 'proj' (parent part: all_0_0_0) -check table full (test2 - all_0_0_0) -all_0_0_0 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broke data of part 'all_0_0_0' -check table full (test2 - all_0_0_0) -all_0_0_0 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used 
projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke data of part 'proj' (parent part: all_2_2_0) -select from projection 'proj', expect error: proj -FILE_DOESNT_EXIST -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -broken projections info -0 -broke all data of part 'proj' (parent part: all_2_2_0) -select from projection 'proj', expect error: proj -Errno -Errno -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -FILE_DOESNT_EXIST -materialize projection proj -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke all data of part 'proj' (parent part: all_1_1_0) -select from projection 'proj', expect error: proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_1_1_0 proj FILE_DOESNT_EXIST -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh deleted file mode 100755 index fbd26e59f6f..00000000000 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ /dev/null @@ -1,515 +0,0 @@ -#!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage, no-parallel -# shellcheck disable=SC2046 - -CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -# shellcheck source=../shell_config.sh -. 
"$CURDIR"/../shell_config.sh - -function create_table() -{ - test_id=$1 - name=$2 - replica=$3 - $CLICKHOUSE_CLIENT -nm -q " - DROP TABLE IF EXISTS $name SYNC; - CREATE TABLE $name - ( - a String, - b String, - c Int64, - d Int64, - e Int64, - - PROJECTION proj - ( - SELECT c ORDER BY d - ), - PROJECTION proj_2 - ( - SELECT d ORDER BY c - ) - ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_32_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a - SETTINGS min_bytes_for_wide_part = 0, - max_parts_to_merge_at_once=3, - enable_vertical_merge_algorithm=1, - vertical_merge_algorithm_min_rows_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - compress_primary_key=0; - " -} - -function random() -{ - cat /dev/urandom | LC_ALL=C tr -dc 'a-zA-Z' | fold -w ${1:-8} | head -n 1 -} - -function insert() -{ - table=$1 - offset=$2 - size=$3 - echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability=0.0;" -} - -function break_projection() -{ - table=$1 - part_name=$2 - parent_name=$3 - break_type=$4 - - read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT path - FROM system.projection_parts - WHERE table='$table' - AND database=currentDatabase() - AND active=1 - AND part_name='$part_name' - AND parent_name='$parent_name' - ORDER BY modification_time DESC - LIMIT 1; - ") - - $CLICKHOUSE_CLIENT -q "select throwIf(substring('$part_path', 1, 1) != '/', 'Path is relative: $part_path')" || exit - - if [ "$break_type" = "data" ] - then - rm "$part_path/d.bin" - rm "$part_path/c.bin" - echo "broke data of part '$part_name' (parent part: $parent_name)" - fi - if [ "$break_type" = "metadata" ] - then - rm "$part_path/columns.txt" - echo "broke metadata of part '$part_name' (parent part: $parent_name)" - fi - if [ "$break_type" = "part" ] - then - rm -r "$part_path" - echo "broke all data of part '$part_name' (parent part: $parent_name)" - fi -} - -function break_part() -{ - table=$1 - part_name=$2 - - read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT path - FROM system.parts - WHERE table='$table' - AND database=currentDatabase() - AND active=1 - AND part_name='$part_name' - ORDER BY modification_time DESC - LIMIT 1; - ") - - if [ "$part_path" = "" ] - then - echo "Part path is empty" - exit - fi - - rm $part_path/columns.txt - echo "broke data of part '$part_name'" -} - -function broken_projections_info() -{ - table=$1 - echo 'broken projections info' - $CLICKHOUSE_CLIENT -q " - SELECT parent_name, name, errors.name FROM - ( - SELECT parent_name, name, exception_code - FROM system.projection_parts - WHERE table='$table' - AND database=currentDatabase() - AND is_broken = 1 - ) AS parts_info - INNER JOIN system.errors AS errors - ON parts_info.exception_code = errors.code - ORDER BY parent_name, name -" -} - -function check() -{ - table=$1 - expect_broken_part="" - expected_error="" - if [ $# -gt 1 ]; then - expect_broken_part=$2 - expected_error=$3 - fi - - #echo 'system.parts' - #$CLICKHOUSE_CLIENT -q " - #SELECT name, active, projections - #FROM system.parts - #WHERE table='$table' AND database=currentDatabase() - #ORDER BY name;" - - query_id=$(random 8) - - if [ "$expect_broken_part" = "proj" ] - then - echo "select from projection 'proj', expect error: $expect_broken_part" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " - 
SET send_logs_level='fatal'; - SELECT c FROM $table WHERE d == 12 ORDER BY c; - " 2>&1 | grep -oF "$expected_error" - else - echo "select from projection 'proj'" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" - echo 'used projections' - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' - " - fi - - query_id=$(random 8) - - if [ "$expect_broken_part" = "proj_2" ] - then - echo "select from projection 'proj_2', expect error: $expect_broken_part" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " - SET send_logs_level='fatal'; - SELECT d FROM $table WHERE c == 12 ORDER BY d; - " 2>&1 | grep -oF "$expected_error" - else - echo "select from projection 'proj_2'" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" - echo 'used projections' - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' - " - fi - - echo 'check table' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table;" -} - -function optimize() -{ - final=$1 - no_wait=$2 - - echo 'optimize' - query="OPTIMIZE TABLE test" - - if [ $final -eq 1 ]; then - query="$query FINAL" - fi - if [ $no_wait -eq 1 ]; then - query="$query SETTINGS alter_sync=0" - fi - - echo $query - - $CLICKHOUSE_CLIENT -q "$query" -} - -function reattach() -{ - echo 'Detach - Attach' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - DETACH TABLE test; - ATTACH TABLE test; - " -} - -function materialize_projection -{ - table=$1 - projection=$2 - echo "materialize projection $projection" - $CLICKHOUSE_CLIENT -q "ALTER TABLE $table MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" -} - -function check_table_full() -{ - table=$1 - expect_broken_part=$2 - echo "check table full ($1 - $2)" - if [ "$expect_broken_part" = "" ] - then - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table SETTINGS check_query_single_value_result = 0; - " | grep "broken" - else - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table SETTINGS check_query_single_value_result = 0; - " | grep "broken" | grep -o $expect_broken_part | head -n 1 - fi -} - -function test1() -{ - create_table test1 test 1 - - table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") - - insert test 0 5 - - insert test 5 5 - - insert test 10 5 - - insert test 15 5 - - check test - - # Break metadata file of projection 'proj' - break_projection test proj all_2_2_0 metadata - - # Do select and after "check table" query. - # Select works because it does not read columns.txt. - check test - - # Projection 'proj' from part all_2_2_0 will now appear in broken parts info - # because it was marked broken during "check table" query. - # TODO: try to mark it during select as well - broken_projections_info test - - # Check table query will also show a list of parts which have broken projections. 
- check_table_full test "all_2_2_0" - - # Break data file of projection 'proj_2' for part all_2_2_0 - break_projection test proj_2 all_2_2_0 data - - # It will not yet appear in broken projections info. - broken_projections_info test - - # Select now fails with error "File doesn't exist" - check test "proj_2" FILE_DOESNT_EXIST - - # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. - broken_projections_info test - - # Second select works, because projection is now marked as broken. - check test - - # Break data file of projection 'proj_2' for part all_3_3_0 - break_projection test proj_2 all_3_3_0 data - - # It will not yet appear in broken projections info. - broken_projections_info test - - insert test 20 5 - - insert test 25 5 - - # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. - # Parts all_4_4_0 and all_5_5_0 have both non-broken projections. - # So a merge will be create for future part all_3_5_1. - # During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. - # Merge will be retried and on second attempt it will succeed. - # The result part all_3_5_1 will have only 1 projection - 'proj', because - # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. - optimize 0 1 - sleep 2 - - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT count() FROM system.text_log - WHERE level='Error' - AND logger_name='MergeTreeBackgroundExecutor' - AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' - " - - # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. - broken_projections_info test - - check test - - break_projection test proj all_1_1_0 metadata - - reattach - - broken_projections_info test - - break_projection test proj_2 all_1_1_0 data - - reattach - - broken_projections_info test - - check test - - check_table_full test all_1_1_0 - - materialize_projection test proj - - check_table_full test - - check test - - materialize_projection test proj_2 - - check_table_full test - - break_projection test proj all_3_5_1_7 data - - insert test 30 5 - - optimize 1 0 - - insert test 35 5 - - optimize 1 0 - - check test -} - -function test2() -{ - create_table test2 test2 1 - - insert test2 0 5 - - insert test2 5 5 - - insert test 10 5 - - insert test 15 5 - - check test2 - - create_table test2 test2_replica 2 - - check test2_replica - - break_projection test2 proj all_0_0_0 data - - check_table_full test2 all_0_0_0 - - check test2 - - break_part test2 all_0_0_0 - - check_table_full test2 all_0_0_0 - - check test2 - - $CLICKHOUSE_CLIENT -q "SYSTEM SYNC REPLICA test2;" - - check test2 -} - -function test3() -{ - create_table test3 test 1 - - insert test 0 5 - - insert test 5 5 - - insert test 10 5 - - insert test 15 5 - - check test - - break_projection test proj all_2_2_0 data - - check test proj FILE_DOESNT_EXIST - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', 
'${CLICKHOUSE_TEST_UNIQUE_NAME}'); - " | grep -o "RESTORED" - - check test - - broken_projections_info test - - break_projection test proj all_2_2_0 part - - check test proj Errno - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') - " 2>&1 | grep -o "FILE_DOESNT_EXIST" - - materialize_projection test proj - - check test - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); - " | grep -o "RESTORED" - - check test - - break_projection test proj all_1_1_0 part - - check test proj FILE_DOESNT_EXIST - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') - settings check_projection_parts=false, allow_backup_broken_projections=true; - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); - " | grep -o "RESTORED" - - check test - - broken_projections_info test -} - -test1 -test2 -test3 - - -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE IF EXISTS test SYNC; -DROP TABLE IF EXISTS test2 SYNC; -DROP TABLE IF EXISTS test2_replica SYNC; -" From 216769f43ea536a38b9e7d5650cdd02fae972caf Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Tue, 16 Jan 2024 18:55:23 +0000 Subject: [PATCH 059/245] Automatic style fix --- tests/integration/test_broken_projections/test.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index ca1a29817a5..cc3e55402b3 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -28,7 +28,7 @@ def cluster(): cluster.shutdown() -def create_table(node, table, replica, data_prefix = ""): +def create_table(node, table, replica, data_prefix=""): if data_prefix == "": data_prefix = table From dea8b10ae972b4fc2b20dbf90d90e362bf7e4207 Mon Sep 17 00:00:00 2001 From: kssenii Date: Wed, 17 Jan 2024 15:39:57 +0100 Subject: [PATCH 060/245] Fix test --- tests/integration/test_broken_projections/test.py | 11 +++-------- 1 file changed, 3 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index ca1a29817a5..90d82f9f010 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -425,9 +425,7 @@ def test_broken_projections_in_backups(cluster): ) check(node, table_name, 1) - assert "" == get_broken_projections_info(node, 
table_name)
-
-    # TODO: add a check for what projections are loaded
 
     break_projection(node, table_name, "proj", "all_2_2_0", "part")
 
@@ -446,8 +444,6 @@ def test_broken_projections_in_backups(cluster):
 
     materialize_projection(node, table_name, "proj")
     check(node, table_name, 1)
-    # TODO:
-    # assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info(node, table_name)
 
     assert "BACKUP_CREATED" in node.query(
         f"""
@@ -466,7 +462,6 @@ def test_broken_projections_in_backups(cluster):
     check(node, table_name, 1)
 
     break_projection(node, table_name, "proj", "all_1_1_0", "part")
-    # TODO: check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST")
     assert "Part all_1_1_0 has a broken projection proj" in check_table_full(
         node, table_name
     )
@@ -477,7 +472,7 @@ def test_broken_projections_in_backups(cluster):
     assert "BACKUP_CREATED" in node.query(
         f"""
         set backup_restore_keeper_fault_injection_probability=0.0;
-        backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false;
+        backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false, allow_backup_broken_projections=true;
         """
     )
 
@@ -488,5 +483,5 @@ def test_broken_projections_in_backups(cluster):
         restore table {table_name} from Disk('backups', 'b4');
         """
     )
-    check(node, table_name, 1)
-    assert "" == get_broken_projections_info(node, table_name)
+    check(node, table_name, 0)
+    assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(node, table_name)

From 1e9de73bf57de1eb66007cba0fecb9f0459c973e Mon Sep 17 00:00:00 2001
From: kssenii
Date: Wed, 17 Jan 2024 15:40:46 +0100
Subject: [PATCH 061/245] Fix style check

---
 tests/integration/test_broken_projections/test.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
index eb8c452fff0..1b192e0df24 100644
--- a/tests/integration/test_broken_projections/test.py
+++ b/tests/integration/test_broken_projections/test.py
@@ -484,4 +484,6 @@ def test_broken_projections_in_backups(cluster):
         """
     )
     check(node, table_name, 0)
-    assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(node, table_name)
+    assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(
+        node, table_name
+    )

From 8ac04c6dd8a945e0f189aae572c54ee4458f75dd Mon Sep 17 00:00:00 2001
From: avogar
Date: Thu, 18 Jan 2024 15:15:57 +0000
Subject: [PATCH 062/245] Address comments

---
 src/DataTypes/DataTypeVariant.cpp             |  9 ++++
 .../Serializations/SerializationVariant.cpp   | 48 +++++++------------
 .../Serializations/SerializationVariant.h     | 23 +++++++++
 .../SerializationVariantElement.cpp           | 14 +++---
 4 files changed, 57 insertions(+), 37 deletions(-)

diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp
index 2bc4dfa5a7a..e0510373960 100644
--- a/src/DataTypes/DataTypeVariant.cpp
+++ b/src/DataTypes/DataTypeVariant.cpp
@@ -105,6 +105,15 @@ ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & fiel
     }
     else
     {
+        /// We don't have an exact mapping Field type -> Data type, so we cannot
+        /// always know in which variant we need to insert the field by its type.
+        /// Examples:
+        /// Field(42) and Variant(UInt16, String). Type of the Field - UInt64, but we can insert it in UInt16
+        /// Field(42) and Variant(Date, String). Type of the Field - UInt64, but we can insert it in Date
+
+        /// Let's first apply the FieldToDataType visitor to find the best Data type for this field.
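+        /// (e.g. for Field(42) the visitor returns UInt64, as in the examples above).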
+ /// If we have variant with such type, we will insert this field into it. + /// Otherwise we will try to find the first variant that has default Field value with the same type. auto field_type = applyVisitor(FieldToDataType(), field); auto discr = tryGetVariantDiscriminator(field_type); if (!discr) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 64fcb63d604..78ec0a5e2da 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -200,19 +200,12 @@ void SerializationVariant::serializeBinaryBulkWithMultipleStreams( for (size_t i = 0; i != limit; ++i) writeBinaryLittleEndian(non_empty_global_discr, *discriminators_stream); - /// Second, serialize variants in global order. + /// Second, serialize non-empty variant (other variants are empty and we can skip their serialization). settings.path.push_back(Substream::VariantElements); - for (size_t i = 0; i != variants.size(); ++i) - { - addVariantElementToPath(settings.path, i); - /// For non empty variant use the same offset/limit as for whole Variant column - if (i == non_empty_global_discr) - variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), offset, limit, settings, variant_state->states[i]); - /// For empty variants, use just 0/0, they won't serialize anything. - else - variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); - settings.path.pop_back(); - } + addVariantElementToPath(settings.path, non_empty_global_discr); + /// We can use the same offset/limit as for whole Variant column + variants[non_empty_global_discr]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(non_empty_global_discr), offset, limit, settings, variant_state->states[non_empty_global_discr]); + settings.path.pop_back(); settings.path.pop_back(); return; } @@ -237,26 +230,22 @@ void SerializationVariant::serializeBinaryBulkWithMultipleStreams( } } - /// If limit for some variant is 0, it means that we don't have its discriminator in the range. - /// Set offset to the size of column for such variants, so we won't serialize values from them. - for (size_t i = 0; i != variant_offsets_and_limits.size(); ++i) - { - if (!variant_offsets_and_limits[i].second) - variant_offsets_and_limits[i].first = col.getVariantByGlobalDiscriminator(i).size(); - } - /// Serialize variants in global order. settings.path.push_back(Substream::VariantElements); for (size_t i = 0; i != variants.size(); ++i) { - addVariantElementToPath(settings.path, i); - variants[i]->serializeBinaryBulkWithMultipleStreams( - col.getVariantByGlobalDiscriminator(i), - variant_offsets_and_limits[i].first, - variant_offsets_and_limits[i].second, - settings, - variant_state->states[i]); - settings.path.pop_back(); + /// Serialize variant only if we have its discriminator in the range. 
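+        /// (a limit of 0 for variant i means that its discriminator does not occur in the serialized range).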
+        if (variant_offsets_and_limits[i].second)
+        {
+            addVariantElementToPath(settings.path, i);
+            variants[i]->serializeBinaryBulkWithMultipleStreams(
+                col.getVariantByGlobalDiscriminator(i),
+                variant_offsets_and_limits[i].first,
+                variant_offsets_and_limits[i].second,
+                settings,
+                variant_state->states[i]);
+            settings.path.pop_back();
+        }
     }
     settings.path.pop_back();
 }
diff --git a/src/DataTypes/Serializations/SerializationVariant.h b/src/DataTypes/Serializations/SerializationVariant.h
index b6bee94c65f..3f53dcf1339 100644
--- a/src/DataTypes/Serializations/SerializationVariant.h
+++ b/src/DataTypes/Serializations/SerializationVariant.h
@@ -6,6 +6,29 @@
 namespace DB
 {
 
+/// Class for serializing/deserializing a column with Variant type.
+/// It supports both text and binary bulk serializations/deserializations.
+///
+/// During text serialization it checks the discriminator of the current row and
+/// uses the corresponding text serialization of this variant.
+///
+/// During text deserialization it tries the deserialization of each variant
+/// (using the tryDeserializeText* methods of ISerialization) in a predefined order
+/// and inserts the data into the first variant for which deserialization succeeds.
+///
+/// During binary bulk serialization it transforms local discriminators
+/// to global ones and serializes them into a separate stream VariantDiscriminators.
+/// Each variant is serialized into a separate stream with path VariantElements/VariantElement
+/// (the VariantElements stream is needed for correct sub-columns creation). We store and serialize
+/// variants in a sparse form (the size of a variant column equals the number of rows with its
+/// discriminator in the discriminators column), so during deserialization the limit for each
+/// variant is calculated according to the discriminators column.
+/// The offsets column is not serialized and is stored only in memory.
+///
+/// During binary bulk deserialization we first deserialize discriminators from the corresponding
+/// stream and use them to calculate the limit for each variant. Each variant is deserialized from
+/// the corresponding stream using the calculated limit. The offsets column is not deserialized;
+/// it is constructed according to the discriminators.
 class SerializationVariant : public ISerialization
 {
 public:
diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
index e06a20d2990..be91e0ba2ee 100644
--- a/src/DataTypes/Serializations/SerializationVariantElement.cpp
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -149,19 +149,21 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
             assert_cast<ColumnLowCardinality &>(*variant_element_state->variant->assumeMutable()).nestedRemoveNullable();
     }
 
+    /// If there is nothing to deserialize, just insert defaults.
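+    /// (variant_limit == 0 means that no discriminator in the deserialized range
+    /// belongs to this variant, so all requested rows are defaults for this sub-column).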
+    if (variant_limit == 0)
+    {
+        mutable_column->insertManyDefaults(limit);
+        return;
+    }
+
     addVariantToPath(settings.path);
     nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache);
     removeVariantFromPath(settings.path);
 
     size_t variant_offset = variant_element_state->variant->size() - variant_limit;
 
-    /// If don't have our discriminator in range, just insert defaults.
-    if (variant_limit == 0)
-    {
-        mutable_column->insertManyDefaults(limit);
-    }
     /// If we have only our discriminator in range, insert the whole range to result column.
-    else if (variant_limit == limit)
+    if (variant_limit == limit)
     {
         mutable_column->insertRangeFrom(*variant_element_state->variant, variant_offset, variant_limit);
     }

From f202d713711857c083de5aaba1198198d2eaa3a4 Mon Sep 17 00:00:00 2001
From: avogar
Date: Thu, 18 Jan 2024 17:29:36 +0000
Subject: [PATCH 063/245] Make alter with variant expansion a no-op, add tests for alters

---
 src/DataTypes/DataTypeVariant.cpp             |  22 ++
 src/DataTypes/DataTypeVariant.h               |   4 +
 .../Serializations/SerializationVariant.cpp   |   2 +-
 .../SerializationVariantElement.cpp           |  16 +-
 src/Storages/MergeTree/MutateTask.cpp         |  20 +-
 .../02941_variant_type_alters.reference       | 330 ++++++++++++++++++
 .../0_stateless/02941_variant_type_alters.sh  |  61 ++++
 7 files changed, 452 insertions(+), 3 deletions(-)
 create mode 100644 tests/queries/0_stateless/02941_variant_type_alters.reference
 create mode 100755 tests/queries/0_stateless/02941_variant_type_alters.sh

diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp
index e0510373960..3a39fdf9ea8 100644
--- a/src/DataTypes/DataTypeVariant.cpp
+++ b/src/DataTypes/DataTypeVariant.cpp
@@ -230,6 +230,28 @@ static DataTypePtr create(const ASTPtr & arguments)
     return std::make_shared<DataTypeVariant>(nested_types);
 }
 
+bool isVariantExtension(const DataTypePtr & from_type, const DataTypePtr & to_type)
+{
+    const auto * from_variant = typeid_cast<const DataTypeVariant *>(from_type.get());
+    const auto * to_variant = typeid_cast<const DataTypeVariant *>(to_type.get());
+    if (!from_variant || !to_variant)
+        return false;
+
+    const auto & to_variants = to_variant->getVariants();
+    std::unordered_set<String> to_variant_types;
+    to_variant_types.reserve(to_variants.size());
+    for (const auto & variant : to_variants)
+        to_variant_types.insert(variant->getName());
+
+    for (const auto & variant : from_variant->getVariants())
+    {
+        if (!to_variant_types.contains(variant->getName()))
+            return false;
+    }
+
+    return true;
+}
+
 
 void registerDataTypeVariant(DataTypeFactory & factory)
 {
diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h
index ca15dff1476..1a1cb6c12f2 100644
--- a/src/DataTypes/DataTypeVariant.h
+++ b/src/DataTypes/DataTypeVariant.h
@@ -61,5 +61,9 @@ private:
     SerializationPtr doGetDefaultSerialization() const override;
 };
 
+/// Check if the conversion from from_type to to_type is a Variant extension
+/// (both types are Variants and to_type contains all variants from from_type).
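+/// For example, Variant(UInt64, String) -> Variant(UInt64, String, Date) is an extension,
+/// while Variant(UInt64, String) -> Variant(UInt64, Date) is not.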
+bool isVariantExtension(const DataTypePtr & from_type, const DataTypePtr & to_type);
+
 }
 
diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp
index 78ec0a5e2da..48a78dd54a9 100644
--- a/src/DataTypes/Serializations/SerializationVariant.cpp
+++ b/src/DataTypes/Serializations/SerializationVariant.cpp
@@ -275,7 +275,7 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams(
     {
         auto * discriminators_stream = settings.getter(settings.path);
         if (!discriminators_stream)
-            throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams");
+            return;
 
         SerializationNumber<ColumnVariant::Discriminator>().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0);
         addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr());
diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
index be91e0ba2ee..80524cbd814 100644
--- a/src/DataTypes/Serializations/SerializationVariantElement.cpp
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -91,7 +91,7 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
     {
         auto * discriminators_stream = settings.getter(settings.path);
         if (!discriminators_stream)
-            throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams");
+            return;
 
         /// If we started to read a new column, reinitialize discriminators column in deserialization state.
         if (!variant_element_state->discriminators || result_column->empty())
@@ -156,10 +156,24 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
         return;
     }
 
+    size_t prev_variant_size = variant_element_state->variant->size();
     addVariantToPath(settings.path);
     nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache);
     removeVariantFromPath(settings.path);
 
+    /// If nothing was deserialized when variant_limit > 0, it means
+    /// that we don't have a stream for such a sub-column.
+    /// It may happen during ALTER MODIFY COLUMN with a Variant extension.
+    /// In this case we should just insert default values.
+    if (variant_element_state->variant->empty())
+    {
+        mutable_column->insertManyDefaults(limit);
+        return;
+    }
+
+    if (variant_element_state->variant->size() != prev_variant_size + variant_limit)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected variant column size after deserialization. Expected {}, got {}", prev_variant_size + variant_limit, variant_element_state->variant->size());
+
     size_t variant_offset = variant_element_state->variant->size() - variant_limit;
 
     /// If we have only our discriminator in range, insert the whole range to result column.
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index e4070aa8262..44734ec98c0 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -22,6 +22,7 @@
 #include
 #include
 #include
+#include <DataTypes/DataTypeVariant.h>
 #include
 #include
 
@@ -1921,7 +1922,7 @@ static bool canSkipConversionToNullable(const MergeTreeDataPartPtr & part, const
     if (!part_column)
         return false;
 
-    /// For ALTER MODIFY COLUMN from 'Type' to 'Nullable(Type)' we can skip mutatation and
+    /// For ALTER MODIFY COLUMN from 'Type' to 'Nullable(Type)' we can skip mutation and
     /// apply only metadata conversion. But it doesn't work for custom serialization.
     const auto * to_nullable = typeid_cast<const DataTypeNullable *>(command.data_type.get());
     if (!to_nullable)
@@ -1937,6 +1938,20 @@ static bool canSkipConversionToNullable(const MergeTreeDataPartPtr & part, const
     return true;
 }
 
+static bool canSkipConversionToVariant(const MergeTreeDataPartPtr & part, const MutationCommand & command)
+{
+    if (command.type != MutationCommand::READ_COLUMN)
+        return false;
+
+    auto part_column = part->tryGetColumn(command.column_name);
+    if (!part_column)
+        return false;
+
+    /// For ALTER MODIFY COLUMN with Variant extension (like 'Variant(T1, T2)' to 'Variant(T1, T2, T3, ...)')
+    /// we can skip mutation and apply only metadata conversion.
+    return isVariantExtension(part_column->type, command.data_type);
+}
+
 static bool canSkipMutationCommandForPart(const MergeTreeDataPartPtr & part, const MutationCommand & command, const ContextPtr & context)
 {
     if (command.partition)
@@ -1952,6 +1967,9 @@ static bool canSkipMutationCommandForPart(const MergeTreeDataPartPtr & part, con
     if (canSkipConversionToNullable(part, command))
         return true;
 
+    if (canSkipConversionToVariant(part, command))
+        return true;
+
     return false;
 }
 
diff --git a/tests/queries/0_stateless/02941_variant_type_alters.reference b/tests/queries/0_stateless/02941_variant_type_alters.reference
new file mode 100644
index 00000000000..52c834e455b
--- /dev/null
+++ b/tests/queries/0_stateless/02941_variant_type_alters.reference
@@ -0,0 +1,330 @@
+Memory
+initial insert
+alter add column 1
+0 0 \N \N \N
+1 1 \N \N \N
+2 2 \N \N \N
+insert after alter add column 1
+0 0 \N \N \N
+1 1 \N \N \N
+2 2 \N \N \N
+3 3 3 \N 3
+4 4 4 \N 4
+5 5 5 \N 5
+6 6 str_6 str_6 \N
+7 7 str_7 str_7 \N
+8 8 str_8 str_8 \N
+9 9 \N \N \N
+10 10 \N \N \N
+11 11 \N \N \N
+12 12 12 \N 12
+13 13 str_13 str_13 \N
+14 14 \N \N \N
+alter modify column 1
+0 0 \N \N \N \N
+1 1 \N \N \N \N
+2 2 \N \N \N \N
+3 3 3 \N 3 \N
+4 4 4 \N 4 \N
+5 5 5 \N 5 \N
+6 6 str_6 str_6 \N \N
+7 7 str_7 str_7 \N \N
+8 8 str_8 str_8 \N \N
+9 9 \N \N \N \N
+10 10 \N \N \N \N
+11 11 \N \N \N \N
+12 12 12 \N 12 \N
+13 13 str_13 str_13 \N \N
+14 14 \N \N \N \N
+insert after alter modify column 1
+0 0 \N \N \N \N
+1 1 \N \N \N \N
+2 2 \N \N \N \N
+3 3 3 \N 3 \N
+4 4 4 \N 4 \N
+5 5 5 \N 5 \N
+6 6 str_6 str_6 \N \N
+7 7 str_7 str_7 \N \N
+8 8 str_8 str_8 \N \N
+9 9 \N \N \N \N
+10 10 \N \N \N \N
+11 11 \N \N \N \N
+12 12 12 \N 12 \N
+13 13 str_13 str_13 \N \N
+14 14 \N \N \N \N
+15 15 1970-01-16 \N \N 1970-01-16
+16 16 1970-01-17 \N \N 1970-01-17
+17 17 1970-01-18 \N \N 1970-01-18
+18 18 1970-01-19 \N \N 1970-01-19
+19 19 \N \N \N \N
+20 20 20 \N 20 \N
+21 21 str_21 str_21 \N \N
+alter modify column 2
+0 0 \N \N \N \N \N \N
+1 1 \N \N \N \N \N \N
+2 2 \N \N \N \N \N \N
+3 3 \N \N 3 \N 3 \N
+4 4 \N \N 4 \N 4 \N
+5 5 \N \N 5 \N 5 \N
+6 6 \N \N str_6 str_6 \N \N
+7 7 \N \N str_7 str_7 \N \N
+8 8 \N \N str_8 str_8 \N \N
+9 9 \N \N 
\N \N \N \N +10 10 \N \N \N \N \N \N +11 11 \N \N \N \N \N \N +12 12 \N \N 12 \N 12 \N +13 13 \N \N str_13 str_13 \N \N +14 14 \N \N \N \N \N \N +15 15 \N \N 1970-01-16 \N \N 1970-01-16 +16 16 \N \N 1970-01-17 \N \N 1970-01-17 +17 17 \N \N 1970-01-18 \N \N 1970-01-18 +18 18 \N \N 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N \N \N +20 20 \N \N 20 \N 20 \N +21 21 \N \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 \N \N \N \N \N \N +1 1 \N \N \N \N \N \N +2 2 \N \N \N \N \N \N +3 3 \N \N 3 \N 3 \N +4 4 \N \N 4 \N 4 \N +5 5 \N \N 5 \N 5 \N +6 6 \N \N str_6 str_6 \N \N +7 7 \N \N str_7 str_7 \N \N +8 8 \N \N str_8 str_8 \N \N +9 9 \N \N \N \N \N \N +10 10 \N \N \N \N \N \N +11 11 \N \N \N \N \N \N +12 12 \N \N 12 \N 12 \N +13 13 \N \N str_13 str_13 \N \N +14 14 \N \N \N \N \N \N +15 15 \N \N 1970-01-16 \N \N 1970-01-16 +16 16 \N \N 1970-01-17 \N \N 1970-01-17 +17 17 \N \N 1970-01-18 \N \N 1970-01-18 +18 18 \N \N 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N \N \N +20 20 \N \N 20 \N 20 \N +21 21 \N \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N +MergeTree compact +initial insert +alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +insert after alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +3 3 3 \N 3 +4 4 4 \N 4 +5 5 5 \N 5 +6 6 str_6 str_6 \N +7 7 str_7 str_7 \N +8 8 str_8 str_8 \N +9 9 \N \N \N +10 10 \N \N \N +11 11 \N \N \N +12 12 12 \N 12 +13 13 str_13 str_13 \N +14 14 \N \N \N +alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +insert after alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +15 15 1970-01-16 \N \N 1970-01-16 +16 16 1970-01-17 \N \N 1970-01-17 +17 17 1970-01-18 \N \N 1970-01-18 +18 18 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N +20 20 20 \N 20 \N +21 21 str_21 str_21 \N \N +alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N 
\N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N +MergeTree wide +initial insert +alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +insert after alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +3 3 3 \N 3 +4 4 4 \N 4 +5 5 5 \N 5 +6 6 str_6 str_6 \N +7 7 str_7 str_7 \N +8 8 str_8 str_8 \N +9 9 \N \N \N +10 10 \N \N \N +11 11 \N \N \N +12 12 12 \N 12 +13 13 str_13 str_13 \N +14 14 \N \N \N +alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +insert after alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +15 15 1970-01-16 \N \N 1970-01-16 +16 16 1970-01-17 \N \N 1970-01-17 +17 17 1970-01-18 \N \N 1970-01-18 +18 18 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N +20 20 20 \N 20 \N +21 21 str_21 str_21 \N \N +alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh new file mode 100755 index 00000000000..9b0d4febd65 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_alters.sh @@ -0,0 +1,61 @@ +#!/usr/bin/env bash +# Tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + +function run() +{ + echo "initial insert" + $CH_CLIENT -q "insert into test select number, number from numbers(3)" + + echo "alter add column 1" + $CH_CLIENT -q "alter table test add column v Variant(UInt64, String) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64 from test order by x" + + echo "insert after alter add column 1" + $CH_CLIENT -q "insert into test select number, number, number from numbers(3, 3)" + $CH_CLIENT -q "insert into test select number, number, 'str_' || toString(number) from numbers(6, 3)" + $CH_CLIENT -q "insert into test select number, number, NULL from numbers(9, 3)" + $CH_CLIENT -q "insert into test select number, number, multiIf(number % 3 == 0, number, number % 3 == 1, 'str_' || toString(number), NULL) from numbers(12, 3)" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64 from test order by x" + + echo "alter modify column 1" + $CH_CLIENT -q "alter table test modify column v Variant(UInt64, String, Date) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64, v.Date from test order by x" + + echo "insert after alter modify column 1" + $CH_CLIENT -q "insert into test select number, number, toDate(number) from numbers(15, 3)" + $CH_CLIENT -q "insert into test select number, number, multiIf(number % 4 == 0, number, number % 4 == 1, 'str_' || toString(number), number % 4 == 2, toDate(number), NULL) from numbers(18, 4)" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64, v.Date from test order by x" + + echo "alter modify column 2" + $CH_CLIENT -q "alter table test modify column y Variant(UInt64, String) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, y.UInt64, y.String, v, v.String, v.UInt64, v.Date from test order by x" + + echo "insert after alter modify column 2" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 0, number, number % 3 == 1, 'str_' || toString(number), NULL), NULL from numbers(22, 3)" + $CH_CLIENT -q "select x, y, y.UInt64, y.String, v, v.String, v.UInt64, v.Date from test order by x" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (x UInt64, y UInt64) engine=Memory" +run +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (x UInt64, y UInt64) engine=MergeTree order by x settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (x UInt64, y UInt64 ) engine=MergeTree order by x settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run +$CH_CLIENT -q "drop table test;" From 4109b6608186b1b9d9dce60f1821313294b7e7c4 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 17:30:32 +0000 Subject: [PATCH 064/245] Remove unneded tag from test --- tests/queries/0_stateless/02941_variant_type_alters.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh index 9b0d4febd65..7e2ecbd67aa 100755 --- a/tests/queries/0_stateless/02941_variant_type_alters.sh +++ b/tests/queries/0_stateless/02941_variant_type_alters.sh @@ -1,5 +1,4 @@ #!/usr/bin/env bash -# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment From 3dcc2056a59f9b374b4de3b72c30107dd7825d47 Mon Sep 17 
00:00:00 2001
From: avogar
Date: Thu, 18 Jan 2024 20:39:36 +0000
Subject: [PATCH 065/245] Fix conflicts

---
 src/DataTypes/Serializations/ISerialization.cpp       | 1 +
 src/DataTypes/Serializations/ISerialization.h         | 1 +
 src/DataTypes/Serializations/SerializationVariant.cpp | 2 +-
 3 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp
index 2f1eb1887af..7d57d72090b 100644
--- a/src/DataTypes/Serializations/ISerialization.cpp
+++ b/src/DataTypes/Serializations/ISerialization.cpp
@@ -54,6 +54,7 @@ const std::set<SubstreamType> ISerialization::Substream::named_types
     TupleElement,
     NamedOffsets,
     NamedNullMap,
+    NamedVariantDiscriminators,
 };
 
 String ISerialization::Substream::toString() const
diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h
index 64a7a889640..7fba9db4acf 100644
--- a/src/DataTypes/Serializations/ISerialization.h
+++ b/src/DataTypes/Serializations/ISerialization.h
@@ -155,6 +155,7 @@ public:
         ObjectData,
 
         VariantDiscriminators,
+        NamedVariantDiscriminators,
         VariantOffsets,
         VariantElements,
         VariantElement,
diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp
index 48a78dd54a9..5af94364167 100644
--- a/src/DataTypes/Serializations/SerializationVariant.cpp
+++ b/src/DataTypes/Serializations/SerializationVariant.cpp
@@ -36,7 +36,7 @@ void SerializationVariant::enumerateStreams(
     const auto * type_variant = data.type ? &assert_cast<const DataTypeVariant &>(*data.type) : nullptr;
     const auto * column_variant = data.column ? &assert_cast<const ColumnVariant &>(*data.column) : nullptr;
 
-    auto discriminators_serialization = std::make_shared<SerializationNamed>(std::make_shared<SerializationNumber<ColumnVariant::Discriminator>>(), "discr", false);
+    auto discriminators_serialization = std::make_shared<SerializationNamed>(std::make_shared<SerializationNumber<ColumnVariant::Discriminator>>(), "discr", SubstreamType::NamedVariantDiscriminators);
 
     auto local_discriminators = column_variant ? 
column_variant->getLocalDiscriminatorsPtr() : nullptr;
 
     settings.path.push_back(Substream::VariantDiscriminators);

From cfc8c60aa70917e48281e3583adc922967326d50 Mon Sep 17 00:00:00 2001
From: avogar
Date: Thu, 18 Jan 2024 21:26:55 +0000
Subject: [PATCH 066/245] Fix build

---
 src/DataTypes/Serializations/SerializationVariantElement.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
index 80524cbd814..8d0acee1c2b 100644
--- a/src/DataTypes/Serializations/SerializationVariantElement.cpp
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -208,8 +208,8 @@ void SerializationVariantElement::removeVariantFromPath(DB::ISerialization::Subs
 }
 
 SerializationVariantElement::VariantSubcolumnCreator::VariantSubcolumnCreator(
-    const DB::ColumnPtr & local_discriminators_,
-    const DB::String & variant_element_name_,
+    const ColumnPtr & local_discriminators_,
+    const String & variant_element_name_,
     const ColumnVariant::Discriminator global_variant_discriminator_,
     const ColumnVariant::Discriminator local_variant_discriminator_)
     : local_discriminators(local_discriminators_)

From 7ae631de1ed1ff4bcb8bac5e06c2026db3ff972c Mon Sep 17 00:00:00 2001
From: avogar
Date: Fri, 19 Jan 2024 10:23:40 +0000
Subject: [PATCH 067/245] Remove wrong check, remove duplicate tests

---
 .../SerializationVariantElement.cpp           |  4 --
 ...> 02943_variant_read_subcolumns.reference} |  0
 ..._1.sh => 02943_variant_read_subcolumns.sh} |  0
 .../02943_variant_read_subcolumns_2.reference |  6 ---
 .../02943_variant_read_subcolumns_2.sh        | 38 -------------------
 5 files changed, 48 deletions(-)
 rename tests/queries/0_stateless/{02943_variant_read_subcolumns_1.reference => 02943_variant_read_subcolumns.reference} (100%)
 rename tests/queries/0_stateless/{02943_variant_read_subcolumns_1.sh => 02943_variant_read_subcolumns.sh} (100%)
 delete mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference
 delete mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh

diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp
index 8d0acee1c2b..56f0e5d77be 100644
--- a/src/DataTypes/Serializations/SerializationVariantElement.cpp
+++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp
@@ -156,7 +156,6 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
         return;
     }
 
-    size_t prev_variant_size = variant_element_state->variant->size();
     addVariantToPath(settings.path);
     nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache);
     removeVariantFromPath(settings.path);
@@ -171,9 +170,6 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams(
         return;
     }
 
-    if (variant_element_state->variant->size() != prev_variant_size + variant_limit)
-        throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected variant column size after deserialization. Expected {}, got {}", prev_variant_size + variant_limit, variant_element_state->variant->size());
-
    size_t variant_offset = variant_element_state->variant->size() - variant_limit;
 
    /// If we have only our discriminator in range, insert the whole range to result column.
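A short note on why the size check removed above had to go, with a hedged sketch (the names follow the diffs above; the control flow is simplified, not the literal function body): after a metadata-only Variant extension an old part has no stream at all for a newly added variant, so the nested deserialization can legitimately read nothing even when variant_limit > 0, and the deserialized size is not guaranteed to advance by exactly variant_limit on every valid read path. The empty() branch kept by the earlier patch already turns the missing-stream case into default values:

    /// Simplified shape of the read path after this patch:
    addVariantToPath(settings.path);
    nested_serialization->deserializeBinaryBulkWithMultipleStreams(
        variant_element_state->variant, variant_limit, settings,
        variant_element_state->variant_element_state, cache);
    removeVariantFromPath(settings.path);

    if (variant_element_state->variant->empty())
    {
        /// No stream for this variant in the part, e.g. the part predates
        /// ALTER MODIFY COLUMN Variant(T1, T2) -> Variant(T1, T2, T3):
        /// fill the requested range with defaults and finish.
        mutable_column->insertManyDefaults(limit);
        return;
    }

    /// Asserting size() == prev_size + variant_limit here could misfire
    /// on valid data, which is presumably why the check was removed.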
diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns.reference similarity index 100% rename from tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference rename to tests/queries/0_stateless/02943_variant_read_subcolumns.reference diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns.sh similarity index 100% rename from tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh rename to tests/queries/0_stateless/02943_variant_read_subcolumns.sh diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference deleted file mode 100644 index 4b93782cddf..00000000000 --- a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference +++ /dev/null @@ -1,6 +0,0 @@ -Memory -test -MergeTree compact -test -MergeTree wide -test diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh deleted file mode 100755 index 9ccad55191f..00000000000 --- a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh +++ /dev/null @@ -1,38 +0,0 @@ -#!/usr/bin/env bash -# Tags: long - -CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -# reset --log_comment -CLICKHOUSE_LOG_COMMENT= -# shellcheck source=../shell_config.sh -. "$CUR_DIR"/../shell_config.sh - -CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " - - -function test() -{ - echo "test" - $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" - $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" - $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" - $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" -} - -$CH_CLIENT -q "drop table if exists test;" - -echo "Memory" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" -test -$CH_CLIENT -q "drop table test;" - -echo "MergeTree compact" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" -test -$CH_CLIENT -q "drop table test;" - -echo "MergeTree wide" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" -test -$CH_CLIENT -q "drop table test;" - From 0c85339ddb26e00ac64d6c763a0f5019b7ee2619 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 19 Jan 2024 10:50:13 +0000 Subject: [PATCH 068/245] Fix style --- src/DataTypes/Serializations/SerializationVariantElement.cpp | 1 - 1 file 
changed, 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 56f0e5d77be..053f8d22d5a 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -9,7 +9,6 @@ namespace DB namespace ErrorCodes { extern const int NOT_IMPLEMENTED; - extern const int LOGICAL_ERROR; } void SerializationVariantElement::enumerateStreams( From a196d04a1c2d5f36ec43c2b0947916be7321037c Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 19 Jan 2024 12:04:16 +0100 Subject: [PATCH 069/245] Update test --- .../test_broken_projections/test.py | 94 +++++++++++++++++-- 1 file changed, 84 insertions(+), 10 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index 1b192e0df24..48ed10d0f87 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -159,6 +159,19 @@ def get_broken_projections_info(node, table): ).strip() +def get_projections_info(node, table): + return node.query( + f""" + SELECT parent_name, name, is_broken + FROM system.projection_parts + WHERE table='{table}' + AND active = 1 + AND database=currentDatabase() + ORDER BY parent_name, name + """ + ).strip() + + def optimize(node, table, final, no_wait): query = f"OPTIMIZE TABLE {table}" if final: @@ -389,6 +402,11 @@ def test_broken_ignored_replicated(cluster): assert "has a broken projection" not in check_table_full(node, table_name) +def get_random_string(string_length=8): + alphabet = string.ascii_letters + string.digits + return "".join((random.choice(alphabet) for _ in range(string_length))) + + def test_broken_projections_in_backups(cluster): node = cluster.instances["node"] @@ -400,6 +418,10 @@ def test_broken_projections_in_backups(cluster): insert(node, table_name, 10, 5) insert(node, table_name, 15, 5) + assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts( + node, table_name + ) + check(node, table_name, 1) break_projection(node, table_name, "proj", "all_2_2_0", "data") @@ -409,10 +431,23 @@ def test_broken_projections_in_backups(cluster): node, table_name ) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t1\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + + backup_name = f"b1-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b1') settings check_projection_parts=false; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false; """ ) @@ -420,18 +455,30 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b1'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + check(node, table_name, 1) assert "" == get_broken_projections_info(node, table_name) - 
break_projection(node, table_name, "proj", "all_2_2_0", "part") + break_projection(node, table_name, "proj_2", "all_2_2_0", "part") - check(node, table_name, 0, "proj", "ErrnoException") + check(node, table_name, 0, "proj_2", "ErrnoException") - assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + assert "all_2_2_0\tproj_2\tFILE_DOESNT_EXIST" == get_broken_projections_info( node, table_name ) @@ -442,13 +489,14 @@ def test_broken_projections_in_backups(cluster): """ ) - materialize_projection(node, table_name, "proj") + materialize_projection(node, table_name, "proj_2") check(node, table_name, 1) + backup_name = f"b3-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b3') settings check_projection_parts=false; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false; """ ) @@ -456,11 +504,23 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b3'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) check(node, table_name, 1) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + break_projection(node, table_name, "proj", "all_1_1_0", "part") assert "Part all_1_1_0 has a broken projection proj" in check_table_full( node, table_name @@ -469,10 +529,11 @@ def test_broken_projections_in_backups(cluster): node, table_name ) + backup_name = f"b4-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false, allow_backup_broken_projections=true; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false, allow_backup_broken_projections=true; """ ) @@ -480,9 +541,22 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b4'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) + + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t1\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + check(node, table_name, 0) assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info( node, table_name From 580501c2b42231eacc4e843968aeb876ff784297 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 19 Jan 2024 11:08:56 +0000 Subject: [PATCH 070/245] Add new settings to settings changes history --- src/Core/SettingsChangesHistory.h | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index 62ffd837a33..af213983b66 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -83,7 +83,9 @@ static std::map sett { {"24.1", {{"print_pretty_type_names", false, true, "Better user experience."}, 
{"input_format_json_read_bools_as_strings", false, true, "Allow to read bools as strings in JSON formats by default"}, - {"output_format_arrow_use_signed_indexes_for_dictionary", false, true, "Use signed indexes type for Arrow dictionaries by default as it's recommended"}}}, + {"output_format_arrow_use_signed_indexes_for_dictionary", false, true, "Use signed indexes type for Arrow dictionaries by default as it's recommended"}, + {"allow_experimental_variant_type", false, false, "Add new experimental Variant type"}, + {"use_variant_when_no_common_type_in_if", false, false, "Allow to use Variant in if/multiIf if there is no common type"}}}, {"23.12", {{"allow_suspicious_ttl_expressions", true, false, "It is a new setting, and in previous versions the behavior was equivalent to allowing."}, {"input_format_parquet_allow_missing_columns", false, true, "Allow missing columns in Parquet files by default"}, {"input_format_orc_allow_missing_columns", false, true, "Allow missing columns in ORC files by default"}, From 7c66141e08ec203dbff908d69d929ea3bfc0995f Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Fri, 19 Jan 2024 11:11:13 +0000 Subject: [PATCH 071/245] Automatic style fix --- tests/integration/test_broken_projections/test.py | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index 48ed10d0f87..8e3978a078e 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -439,8 +439,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t1\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) backup_name = f"b1-{get_random_string()}" @@ -467,8 +466,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) check(node, table_name, 1) @@ -517,8 +515,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) break_projection(node, table_name, "proj", "all_1_1_0", "part") @@ -553,8 +550,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) check(node, table_name, 0) From c51d1f04f6d135c63f5123d4aaef47cef5474525 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 19 Jan 2024 15:57:20 +0100 Subject: [PATCH 072/245] Add settings max_unexpected_write_error_retries for Azure Blob Storage --- src/Core/Settings.h | 1 + src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp | 10 +++++----- src/Disks/IO/WriteBufferFromAzureBlobStorage.h | 2 ++ .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 3 ++- .../AzureBlobStorage/AzureObjectStorage.cpp | 1 + .../AzureBlobStorage/AzureObjectStorage.h | 5 ++++- 6 files changed, 15 insertions(+), 7 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 292e945a29c..59f32c60f63 100644 --- a/src/Core/Settings.h 
+++ b/src/Core/Settings.h
@@ -86,6 +86,7 @@ class IColumn;
     M(UInt64, azure_max_single_part_upload_size, 100*1024*1024, "The maximum size of object to upload using singlepart upload to Azure blob storage.", 0) \
     M(UInt64, s3_max_single_read_retries, 4, "The maximum number of retries during single S3 read.", 0) \
     M(UInt64, azure_max_single_read_retries, 4, "The maximum number of retries during single Azure blob storage read.", 0) \
+    M(UInt64, azure_max_unexpected_write_error_retries, 4, "The maximum number of retries in case of unexpected errors during Azure blob storage write", 0) \
     M(UInt64, s3_max_unexpected_write_error_retries, 4, "The maximum number of retries in case of unexpected errors during S3 write.", 0) \
     M(UInt64, s3_max_redirects, 10, "Max number of S3 redirects hops allowed.", 0) \
     M(UInt64, s3_max_connections, 1024, "The maximum number of connections per server.", 0) \
diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp
index 60bc04f5f95..b4665eb7346 100644
--- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp
+++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp
@@ -18,17 +18,17 @@ namespace ProfileEvents
 namespace DB
 {
 
-static constexpr auto DEFAULT_RETRY_NUM = 3;
-
 WriteBufferFromAzureBlobStorage::WriteBufferFromAzureBlobStorage(
     std::shared_ptr<const Azure::Storage::Blobs::BlobContainerClient> blob_container_client_,
     const String & blob_path_,
     size_t max_single_part_upload_size_,
+    size_t max_unexpected_write_error_retries_,
     size_t buf_size_,
     const WriteSettings & write_settings_)
     : WriteBufferFromFileBase(buf_size_, nullptr, 0)
     , log(&Poco::Logger::get("WriteBufferFromAzureBlobStorage"))
     , max_single_part_upload_size(max_single_part_upload_size_)
+    , max_unexpected_write_error_retries(max_unexpected_write_error_retries_)
     , blob_path(blob_path_)
     , write_settings(write_settings_)
     , blob_container_client(blob_container_client_)
@@ -77,13 +77,13 @@ void WriteBufferFromAzureBlobStorage::execWithRetry(std::function<void()> func,
 
 void WriteBufferFromAzureBlobStorage::finalizeImpl()
 {
-    execWithRetry([this](){ next(); }, DEFAULT_RETRY_NUM);
+    execWithRetry([this](){ next(); }, max_unexpected_write_error_retries);
 
     if (tmp_buffer_write_offset > 0)
         uploadBlock(tmp_buffer->data(), tmp_buffer_write_offset);
 
     auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path);
-    execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, DEFAULT_RETRY_NUM);
+    execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, max_unexpected_write_error_retries);
 
     LOG_TRACE(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path);
 }
@@ -94,7 +94,7 @@ void WriteBufferFromAzureBlobStorage::uploadBlock(const char * data, size_t size
     const std::string & block_id = block_ids.emplace_back(getRandomASCIIString(64));
 
     Azure::Core::IO::MemoryBodyStream memory_stream(reinterpret_cast<const uint8_t *>(data), size);
-    execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, DEFAULT_RETRY_NUM, size);
+    execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, max_unexpected_write_error_retries, size);
     tmp_buffer_write_offset = 0;
 
     LOG_TRACE(log, "Staged block (id: {}) of size {} (blob path: {}).", block_id, size, blob_path);
diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h
index f1be81922e1..7494130134b 100644
--- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h
+++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h
@@ -30,6 +30,7 @@ public:
         AzureClientPtr 
blob_container_client_,
         const String & blob_path_,
         size_t max_single_part_upload_size_,
+        size_t max_unexpected_write_error_retries_,
         size_t buf_size_,
         const WriteSettings & write_settings_);
 
@@ -48,6 +49,7 @@ private:
     Poco::Logger * log;
 
     const size_t max_single_part_upload_size;
+    const size_t max_unexpected_write_error_retries;
     const std::string blob_path;
     const WriteSettings write_settings;
diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
index a5c8afe0264..a209049ceee 100644
--- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
+++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
@@ -164,7 +164,8 @@ std::unique_ptr<AzureObjectStorageSettings> getAzureBlobStorageSettings(const Po
         config.getUInt64(config_prefix + ".min_bytes_for_seek", 1024 * 1024),
         config.getInt(config_prefix + ".max_single_read_retries", 3),
         config.getInt(config_prefix + ".max_single_download_retries", 3),
-        config.getInt(config_prefix + ".list_object_keys_size", 1000)
+        config.getInt(config_prefix + ".list_object_keys_size", 1000),
+        config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", 4)
     );
 }
 
diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp
index 068e2aebab1..683bfeb74a7 100644
--- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp
+++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp
@@ -268,6 +268,7 @@ std::unique_ptr<WriteBufferFromFileBase> AzureObjectStorage::writeObject( /// NO
         client.get(),
         object.remote_path,
         settings.get()->max_single_part_upload_size,
+        settings.get()->max_unexpected_write_error_retries,
         buf_size,
         patchSettings(write_settings));
 }
 
diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h
index 4718dce9bf9..2d505c6a022 100644
--- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h
+++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h
@@ -23,12 +23,14 @@ struct AzureObjectStorageSettings
         uint64_t min_bytes_for_seek_,
         int max_single_read_retries_,
         int max_single_download_retries_,
-        int list_object_keys_size_)
+        int list_object_keys_size_,
+        size_t max_unexpected_write_error_retries_)
         : max_single_part_upload_size(max_single_part_upload_size_)
         , min_bytes_for_seek(min_bytes_for_seek_)
         , max_single_read_retries(max_single_read_retries_)
         , max_single_download_retries(max_single_download_retries_)
         , list_object_keys_size(list_object_keys_size_)
+        , max_unexpected_write_error_retries (max_unexpected_write_error_retries_)
     {
     }
 
@@ -39,6 +41,7 @@ struct AzureObjectStorageSettings
     size_t max_single_read_retries = 3;
     size_t max_single_download_retries = 3;
     int list_object_keys_size = 1000;
+    size_t max_unexpected_write_error_retries = 4;
 };
 
 using AzureClient = Azure::Storage::Blobs::BlobContainerClient;

From d22fc3a224ac29857f3dc3eb60ff872221829006 Mon Sep 17 00:00:00 2001
From: Smita Kulkarni
Date: Fri, 19 Jan 2024 16:13:58 +0100
Subject: [PATCH 073/245] Updated to fetch default from settings

---
 .../ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
index a209049ceee..e0199fde98b 100644
--- 
a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
+++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp
@@ -7,6 +7,7 @@
 #include
 #include
 #include
+#include <Interpreters/Context.h>
 
 using namespace Azure::Storage::Blobs;
 
@@ -157,7 +158,7 @@ std::unique_ptr<BlobContainerClient> getAzureBlobContainerClient(
     }
 }
 
-std::unique_ptr<AzureObjectStorageSettings> getAzureBlobStorageSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr /*context*/)
+std::unique_ptr<AzureObjectStorageSettings> getAzureBlobStorageSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr context)
 {
     return std::make_unique<AzureObjectStorageSettings>(
         config.getUInt64(config_prefix + ".max_single_part_upload_size", 100 * 1024 * 1024),
@@ -165,7 +166,7 @@ std::unique_ptr<AzureObjectStorageSettings> getAzureBlobStorageSettings(const Po
         config.getInt(config_prefix + ".max_single_read_retries", 3),
         config.getInt(config_prefix + ".max_single_download_retries", 3),
         config.getInt(config_prefix + ".list_object_keys_size", 1000),
-        config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", 4)
+        config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries)
     );
 }

From caf9d8df6d789203a4e408341c9494952eb14ad2 Mon Sep 17 00:00:00 2001
From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com>
Date: Sat, 20 Jan 2024 14:59:13 +0100
Subject: [PATCH 074/245] Update test.py

---
 tests/integration/test_broken_projections/test.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
index 8e3978a078e..d750bb5827d 100644
--- a/tests/integration/test_broken_projections/test.py
+++ b/tests/integration/test_broken_projections/test.py
@@ -413,6 +413,8 @@ def test_broken_projections_in_backups(cluster):
     table_name = "test4"
     create_table(node, table_name, 1)
 
+    node.qeury("SYSTEM STOP MERGES")
+
     insert(node, table_name, 0, 5)
     insert(node, table_name, 5, 5)
     insert(node, table_name, 10, 5)
@@ -557,3 +559,4 @@ def test_broken_projections_in_backups(cluster):
     assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(
         node, table_name
     )
+    node.qeury("SYSTEM START MERGES")

From e5c3b67f379efdd6d403be08f8bce164348663a1 Mon Sep 17 00:00:00 2001
From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com>
Date: Sat, 20 Jan 2024 16:10:09 +0100
Subject: [PATCH 075/245] Update test.py

---
 tests/integration/test_broken_projections/test.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
index d750bb5827d..acf0160cf1b 100644
--- a/tests/integration/test_broken_projections/test.py
+++ b/tests/integration/test_broken_projections/test.py
@@ -413,7 +413,7 @@ def test_broken_projections_in_backups(cluster):
     table_name = "test4"
     create_table(node, table_name, 1)
 
-    node.qeury("SYSTEM STOP MERGES")
+    node.query("SYSTEM STOP MERGES")
 
     insert(node, table_name, 0, 5)
     insert(node, table_name, 5, 5)
@@ -559,4 +559,4 @@ def test_broken_projections_in_backups(cluster):
     assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(
         node, table_name
     )
-    node.qeury("SYSTEM START MERGES")
+    node.query("SYSTEM START MERGES")

From 02b178cc9c9b38a30344e2ddd896c1eaf429c3de Mon Sep 17 00:00:00 2001
From: MochiXu
Date: Mon, 22 Jan 2024 11:08:03 +0800
Subject: [PATCH 076/245] fix drop inverted index

---
 src/Storages/MergeTree/MutateTask.cpp | 22 
++++++++++++++-------- 1 file changed, 14 insertions(+), 8 deletions(-) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index e4070aa8262..8ed8b8bba4c 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -674,15 +674,21 @@ static NameToNameVector collectFilesForRenames( { if (command.type == MutationCommand::Type::DROP_INDEX) { - if (source_part->checksums.has(INDEX_FILE_PREFIX + command.column_name + ".idx2")) + const std::vector suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; + + for (const auto& suffix : suffixes) { - add_rename(INDEX_FILE_PREFIX + command.column_name + ".idx2", ""); - add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); - } - else if (source_part->checksums.has(INDEX_FILE_PREFIX + command.column_name + ".idx")) - { - add_rename(INDEX_FILE_PREFIX + command.column_name + ".idx", ""); - add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); + String filename = INDEX_FILE_PREFIX + command.column_name + suffix; + + if ((suffix == ".idx2" || suffix == ".idx") && source_part->checksums.has(filename)) + { + add_rename(filename, ""); + add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); + } + else if (source_part->checksums.has(filename)) + { + add_rename(filename, ""); + } } } else if (command.type == MutationCommand::Type::DROP_PROJECTION) From b4dcd6755a8a2384e5937991e0656058aed4f95a Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 22 Jan 2024 13:41:58 +0000 Subject: [PATCH 077/245] Use ColumnConst instead of Field in IColumn::createWithOffsets --- src/Columns/ColumnConst.cpp | 22 +++++++++++++++++++ src/Columns/ColumnConst.h | 5 +++++ src/Columns/ColumnNullable.cpp | 16 ++++++-------- src/Columns/ColumnNullable.h | 2 +- src/Columns/ColumnObject.cpp | 3 ++- src/Columns/ColumnSparse.cpp | 3 ++- src/Columns/ColumnVector.cpp | 5 +++-- src/Columns/ColumnVector.h | 2 +- src/Columns/IColumn.cpp | 6 ++--- src/Columns/IColumn.h | 5 +++-- src/Functions/IFunction.cpp | 4 ++-- .../0_stateless/02941_variant_type_alters.sh | 1 + 12 files changed, 52 insertions(+), 22 deletions(-) diff --git a/src/Columns/ColumnConst.cpp b/src/Columns/ColumnConst.cpp index 9aa0f5cfa49..6e5a3c45c4e 100644 --- a/src/Columns/ColumnConst.cpp +++ b/src/Columns/ColumnConst.cpp @@ -159,4 +159,26 @@ void ColumnConst::compareColumn( std::fill(compare_results.begin(), compare_results.end(), res); } +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, Field value) +{ + auto data = column->cloneEmpty(); + data->insert(value); + return ColumnConst::create(std::move(data), 1); +} + +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, size_t const_value_index) +{ + auto data = column->cloneEmpty(); + data->insertFrom(*column, const_value_index); + return ColumnConst::create(std::move(data), 1); +} + +ColumnConst::Ptr createColumnConstWithDefaultValue(const ColumnPtr & column) +{ + auto data = column->cloneEmpty(); + data->insertDefault(); + return ColumnConst::create(std::move(data), 1); +} + + } diff --git a/src/Columns/ColumnConst.h b/src/Columns/ColumnConst.h index dc84e0c2402..3c646a62795 100644 --- a/src/Columns/ColumnConst.h +++ b/src/Columns/ColumnConst.h @@ -292,4 +292,9 @@ public: bool isCollationSupported() const override { return data->isCollationSupported(); } }; +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, Field value); +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, size_t 
const_value_index);
+ColumnConst::Ptr createColumnConstWithDefaultValue(const ColumnPtr &column);
+
+
 }
diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp
index 25b0e35e15e..c0b13204b8e 100644
--- a/src/Columns/ColumnNullable.cpp
+++ b/src/Columns/ColumnNullable.cpp
@@ -827,24 +827,22 @@ void ColumnNullable::checkConsistency() const
             "Logical error: Sizes of nested column and null map of Nullable column are not equal");
 }
 
-ColumnPtr ColumnNullable::createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const
+ColumnPtr ColumnNullable::createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const
 {
     ColumnPtr new_values;
     ColumnPtr new_null_map;
 
-    if (default_field.getType() == Field::Types::Null)
+    const ColumnNullable & nullable_column_with_default_value = assert_cast<const ColumnNullable &>(column_with_default_value.getDataColumn());
+    if (nullable_column_with_default_value.isNullAt(0))
     {
-        auto default_column = nested_column->cloneEmpty();
-        default_column->insertDefault();
-
         /// Value in main column, when null map is 1 is implementation defined. So, take any value.
-        new_values = nested_column->createWithOffsets(offsets, (*default_column)[0], total_rows, shift);
-        new_null_map = null_map->createWithOffsets(offsets, Field(1u), total_rows, shift);
+        new_values = nested_column->createWithOffsets(offsets, *createColumnConstWithDefaultValue(nested_column), total_rows, shift);
+        new_null_map = null_map->createWithOffsets(offsets, *createColumnConst(null_map, Field(1u)), total_rows, shift);
     }
     else
     {
-        new_values = nested_column->createWithOffsets(offsets, default_field, total_rows, shift);
-        new_null_map = null_map->createWithOffsets(offsets, Field(0u), total_rows, shift);
+        new_values = nested_column->createWithOffsets(offsets, *ColumnConst::create(nullable_column_with_default_value.getNestedColumnPtr(), 1), total_rows, shift);
+        new_null_map = null_map->createWithOffsets(offsets, *createColumnConst(null_map, Field(0u)), total_rows, shift);
     }
 
     return ColumnNullable::create(new_values, new_null_map);
diff --git a/src/Columns/ColumnNullable.h b/src/Columns/ColumnNullable.h
index 60c7750f8fc..3e04ba8a180 100644
--- a/src/Columns/ColumnNullable.h
+++ b/src/Columns/ColumnNullable.h
@@ -167,7 +167,7 @@ public:
         getIndicesOfNonDefaultRowsImpl(indices, from, limit);
     }
 
-    ColumnPtr createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const override;
+    ColumnPtr createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const override;
 
     bool isNullable() const override { return true; }
     bool isFixedAndContiguous() const override { return false; }
diff --git a/src/Columns/ColumnObject.cpp b/src/Columns/ColumnObject.cpp
index f7176568a1b..0ec9c616bab 100644
--- a/src/Columns/ColumnObject.cpp
+++ b/src/Columns/ColumnObject.cpp
@@ -2,6 +2,7 @@
 #include
 #include
 #include
+#include <Columns/ColumnConst.h>
 #include
 #include
 #include
@@ -475,7 +476,7 @@ void ColumnObject::Subcolumn::finalize()
         {
             auto values = part->index(*offsets, offsets->size());
             values = castColumn({values, from_type, ""}, to_type);
-            part = values->createWithOffsets(offsets_data, to_type->getDefault(), part_size, /*shift=*/ 0);
+            part = values->createWithOffsets(offsets_data, *createColumnConstWithDefaultValue(result_column->getPtr()), part_size, /*shift=*/ 0);
         }
     }
 
diff --git a/src/Columns/ColumnSparse.cpp 
b/src/Columns/ColumnSparse.cpp
index 02e6e9e56b4..eeeec912ce8 100644
--- a/src/Columns/ColumnSparse.cpp
+++ b/src/Columns/ColumnSparse.cpp
@@ -1,6 +1,7 @@
 #include
 #include
 #include
+#include <Columns/ColumnConst.h>
 #include
 #include
 #include
@@ -130,7 +131,7 @@ StringRef ColumnSparse::getDataAt(size_t n) const
 
 ColumnPtr ColumnSparse::convertToFullColumnIfSparse() const
 {
-    return values->createWithOffsets(getOffsetsData(), (*values)[0], _size, /*shift=*/ 1);
+    return values->createWithOffsets(getOffsetsData(), *createColumnConst(values, 0), _size, /*shift=*/ 1);
 }
 
 void ColumnSparse::insertSingleValue(const Inserter & inserter)
diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp
index b1cf449dfde..3aadc530878 100644
--- a/src/Columns/ColumnVector.cpp
+++ b/src/Columns/ColumnVector.cpp
@@ -2,6 +2,7 @@
 
 #include
 #include
+#include <Columns/ColumnConst.h>
 #include
 #include
 #include
@@ -940,7 +941,7 @@ ColumnPtr ColumnVector<T>::compress() const
 }
 
 template <typename T>
-ColumnPtr ColumnVector<T>::createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const
+ColumnPtr ColumnVector<T>::createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const
 {
     if (offsets.size() + shift != size())
         throw Exception(ErrorCodes::LOGICAL_ERROR,
@@ -949,7 +950,7 @@ ColumnPtr ColumnVector<T>::createWithOffsets(const IColumn::Offsets & offsets, c
     auto res = this->create();
     auto & res_data = res->getData();
 
-    T default_value = static_cast<T>(default_field.safeGet<T>());
+    T default_value = assert_cast<const ColumnVector<T> &>(column_with_default_value.getDataColumn()).getElement(0);
     res_data.resize_fill(total_rows, default_value);
     for (size_t i = 0; i < offsets.size(); ++i)
         res_data[offsets[i]] = data[i + shift];
diff --git a/src/Columns/ColumnVector.h b/src/Columns/ColumnVector.h
index fab2d5f06aa..652cc1f5ff9 100644
--- a/src/Columns/ColumnVector.h
+++ b/src/Columns/ColumnVector.h
@@ -379,7 +379,7 @@ public:
         return this->template getIndicesOfNonDefaultRowsImpl(indices, from, limit);
     }
 
-    ColumnPtr createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const override;
+    ColumnPtr createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const override;
 
     ColumnPtr compress() const override;
 
diff --git a/src/Columns/IColumn.cpp b/src/Columns/IColumn.cpp
index 82dc82e0bd9..d7f83b822d2 100644
--- a/src/Columns/IColumn.cpp
+++ b/src/Columns/IColumn.cpp
@@ -35,7 +35,7 @@ void IColumn::insertFrom(const IColumn & src, size_t n)
     insert(src[n]);
 }
 
-ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const
+ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const
 {
     if (offsets.size() + shift != size())
         throw Exception(ErrorCodes::LOGICAL_ERROR,
@@ -51,14 +51,14 @@ ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const Field & defa
             current_offset = offsets[i];
 
             if (offsets_diff > 1)
-                res->insertMany(default_field, offsets_diff - 1);
+                res->insertManyFrom(column_with_default_value.getDataColumn(), 0, offsets_diff - 1);
 
             res->insertFrom(*this, i + shift);
     }
 
     ssize_t offsets_diff = static_cast<ssize_t>(total_rows) - current_offset;
     if (offsets_diff > 1)
-        res->insertMany(default_field, offsets_diff - 1);
+        res->insertManyFrom(column_with_default_value.getDataColumn(), 0, offsets_diff - 
1); return res; } diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index 3f866e6213d..1dcd3acdd19 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -34,6 +34,7 @@ class Arena; class ColumnGathererStream; class Field; class WeakHash32; +class ColumnConst; /* * Represents a set of equal ranges in previous column to perform sorting in current column. @@ -462,10 +463,10 @@ public: /// Returns column with @total_size elements. /// In result column values from current column are at positions from @offsets. - /// Other values are filled by @default_value. + /// Other values are filled by value from @column_with_default_value. /// @shift means how much rows to skip from the beginning of current column. /// Used to create full column from sparse. - [[nodiscard]] virtual Ptr createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const; + [[nodiscard]] virtual Ptr createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const; /// Compress column in memory to some representation that allows to decompress it back. /// Return itself if compression is not applicable for this column type. diff --git a/src/Functions/IFunction.cpp b/src/Functions/IFunction.cpp index a46f4d2a11d..d4c6b8f4ba6 100644 --- a/src/Functions/IFunction.cpp +++ b/src/Functions/IFunction.cpp @@ -313,7 +313,7 @@ ColumnPtr IExecutableFunction::execute(const ColumnsWithTypeAndName & arguments, { bool use_default_implementation_for_sparse_columns = useDefaultImplementationForSparseColumns(); /// DataTypeFunction does not support obtaining default (isDefaultAt()) - /// ColumnFunction does not support getting specific values + /// ColumnFunction does not support getting specific values. 
if (result_type->getTypeId() != TypeIndex::Function && use_default_implementation_for_sparse_columns)
         {
             size_t num_sparse_columns = 0;
@@ -368,7 +368,7 @@ ColumnPtr IExecutableFunction::execute(const ColumnsWithTypeAndName & arguments,
         if (!result_type->canBeInsideSparseColumns() || !res->isDefaultAt(0) || res->getNumberOfDefaultRows() != 1)
         {
             const auto & offsets_data = assert_cast<const ColumnVector<UInt64> &>(*sparse_offsets).getData();
-            return res->createWithOffsets(offsets_data, (*res)[0], input_rows_count, /*shift=*/ 1);
+            return res->createWithOffsets(offsets_data, *createColumnConst(res, 0), input_rows_count, /*shift=*/ 1);
         }
 
         return ColumnSparse::create(res, sparse_offsets, input_rows_count);
diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh
index 7e2ecbd67aa..9b0d4febd65 100755
--- a/tests/queries/0_stateless/02941_variant_type_alters.sh
+++ b/tests/queries/0_stateless/02941_variant_type_alters.sh
@@ -1,4 +1,5 @@
 #!/usr/bin/env bash
+# Tags: long
 
 CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
 # reset --log_comment

From 15e3a5b3961ac304a30ef211594f57bda3a2f584 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Mon, 22 Jan 2024 14:57:10 +0100
Subject: [PATCH 078/245] Try fix flaky test

---
 tests/integration/test_broken_projections/test.py | 16 +++++++++++-----
 1 file changed, 11 insertions(+), 5 deletions(-)

diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
index acf0160cf1b..87d910b9c77 100644
--- a/tests/integration/test_broken_projections/test.py
+++ b/tests/integration/test_broken_projections/test.py
@@ -28,10 +28,17 @@ def cluster():
         cluster.shutdown()
 
 
-def create_table(node, table, replica, data_prefix=""):
+def create_table(node, table, replica, data_prefix="", aggressive_merge=True):
     if data_prefix == "":
         data_prefix = table
 
+    if aggressive_merge:
+        vertical_merge_algorithm_min_rows_to_activate = 1
+        vertical_merge_algorithm_min_columns_to_activate = 1
+    else:
+        vertical_merge_algorithm_min_rows_to_activate = 100000
+        vertical_merge_algorithm_min_columns_to_activate = 100
+
     node.query(
         f"""
         DROP TABLE IF EXISTS {table} SYNC;
@@ -56,9 +63,8 @@ def create_table(node, table, replica, data_prefix=""):
         SETTINGS min_bytes_for_wide_part = 0,
         max_parts_to_merge_at_once=3,
         enable_vertical_merge_algorithm=1,
-        vertical_merge_algorithm_min_rows_to_activate = 1,
-        vertical_merge_algorithm_min_columns_to_activate = 1,
-        vertical_merge_algorithm_min_columns_to_activate = 1,
+        vertical_merge_algorithm_min_rows_to_activate = {vertical_merge_algorithm_min_rows_to_activate},
+        vertical_merge_algorithm_min_columns_to_activate = {vertical_merge_algorithm_min_columns_to_activate},
         compress_primary_key=0;
         """
     )
@@ -411,7 +417,7 @@ def test_broken_projections_in_backups(cluster):
     node = cluster.instances["node"]
 
     table_name = "test4"
-    create_table(node, table_name, 1)
+    create_table(node, table_name, 1, aggressive_merge=False)
 
     node.query("SYSTEM STOP MERGES")
 
From 0606a772674fdecf08a9a904ef46293e8bba9acc Mon Sep 17 00:00:00 2001
From: mochi
Date: Mon, 22 Jan 2024 22:02:50 +0800
Subject: [PATCH 079/245] Update src/Storages/MergeTree/MutateTask.cpp

Co-authored-by: Dmitry Novik

---
 src/Storages/MergeTree/MutateTask.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 8ed8b8bba4c..fccee6bd887 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ 
-676,7 +676,7 @@ static NameToNameVector collectFilesForRenames( { const std::vector suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; - for (const auto& suffix : suffixes) + for (const auto & suffix : suffixes) { String filename = INDEX_FILE_PREFIX + command.column_name + suffix; From 4e5249275ed67c52d958007978c66619db22a1a5 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 22 Jan 2024 16:45:25 +0100 Subject: [PATCH 080/245] Do not resolve remote table id on initiator --- src/Storages/StorageDistributed.cpp | 9 +-------- 1 file changed, 1 insertion(+), 8 deletions(-) diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index 987ea4a4957..9972517bbac 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -779,18 +779,11 @@ QueryTreeNodePtr buildQueryTreeDistributed(SelectQueryInfo & query_info, } else { - auto resolved_remote_storage_id = remote_storage_id; - // In case of cross-replication we don't know what database is used for the table. - // `storage_id.hasDatabase()` can return false only on the initiator node. - // Each shard will use the default database (in the case of cross-replication shards may have different defaults). - if (remote_storage_id.hasDatabase()) - resolved_remote_storage_id = query_context->resolveStorageID(remote_storage_id); - auto get_column_options = GetColumnsOptions(GetColumnsOptions::All).withExtendedObjects().withVirtuals(); auto column_names_and_types = distributed_storage_snapshot->getColumns(get_column_options); - auto storage = std::make_shared(resolved_remote_storage_id, ColumnsDescription{column_names_and_types}); + auto storage = std::make_shared(remote_storage_id, ColumnsDescription{column_names_and_types}); auto table_node = std::make_shared(std::move(storage), query_context); if (table_expression_modifiers) From c59f3e164ffedf1a7561b0fd0a65c2555685ca91 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Thu, 18 Jan 2024 12:08:29 -0800 Subject: [PATCH 081/245] Return baseline component as fourth array --- .../sql-reference/functions/time-series-functions.md | 8 ++++++-- src/Functions/seriesDecomposeSTL.cpp | 10 +++++++++- .../0_stateless/02813_seriesDecomposeSTL.reference | 8 ++++---- 3 files changed, 19 insertions(+), 7 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 144d832b36a..2e42aa884b4 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -77,8 +77,8 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of three arrays where the first array include seasonal components, the second array - trend, -and the third array - residue component. +- An array of four arrays where the first array include seasonal components, the second array - trend, +the third array - residue component, and the fourth array - baseline component. Type: [Array](../../sql-reference/data-types/array.md). 
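Since the baseline is by construction the element-wise sum of the seasonal and trend components, the new fourth array can be sanity-checked directly. A quick check, reusing the series and period from the documentation example above (the commented output is the expectation, not a recorded result):

```sql
WITH seriesDecomposeSTL(
        [10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34,
         10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34,
         10.1, 20.45, 40.34, 10.1, 20.45, 40.34], 3) AS d
SELECT arrayMap((s, t, b) -> round(b - (s + t), 4), d[1], d[2], d[4]) AS baseline_minus_sum;
-- Expected: an array of 24 zeros, up to Float32 rounding.
```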
@@ -107,6 +107,10 @@ Result: [ 0, 0.0000019073486, -0.0000019073486, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, -0.0000019073486, 0, 0 + ], + [ + 10.1, 20.449999, 40.340004, 10.100001, 20.45, 40.34, 10.100001, 20.45, 40.34, 10.1, 20.45, 40.34, + 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.100002, 20.45, 40.34 ]] │ └────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┘ ``` diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 21e36761213..0c44afa32a6 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -128,6 +128,10 @@ public: res_data.insert(residue.begin(), residue.end()); res_col_offsets_data.push_back(res_data.size()); + // Create Baseline = seasonal + trend + std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); + res_col_offsets_data.push_back(res_data.size()); + root_offsets_data.push_back(res_col_offsets->size()); prev_src_offset = curr_offset; @@ -201,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of three arrays where the first array include seasonal components, the second array - trend, and the third array - residue component. +- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline component. Type: [Array](../../sql-reference/data-types/array.md). @@ -230,6 +234,10 @@ Result: [ 0, 0.0000019073486, -0.0000019073486, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, -0.0000019073486, 0, 0 + ], + [ + 10.1, 20.449999, 40.340004, 10.100001, 20.45, 40.34, 10.100001, 20.45, 40.34, 10.1, 20.45, 40.34, + 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.100002, 20.45, 40.34 ]] │ └────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┘ ```)", diff --git a/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference b/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference index dc30e7f8371..28dae705335 100644 --- a/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference +++ b/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference @@ -1,4 +1,4 @@ -[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0]] -[[4.04452e-8,-1.7846537e-8,-5.9488454e-9,0,0,0,0,0,0,-1.9868216e-8,-9.5297715e-8,2.2540547e-9,3.4229203e-8,8.573613e-8],[1.9999999,2,2,2,2,2,2,2,2,2,2,2,1.9999996,1.9999996],[1.1920929e-7,0,0,0,0,0,0,0,0,0,0,0,3.5762787e-7,2.3841858e-7]] 
-[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0]] -[[53.946846,-4.8119445,43.525013,-23.71359,-42.472305,-51.636955,-50.458298,-51.982674,37.62072,-15.9006605,56.65076,-5.809669,57.143845,-2.0370207,54.050922,-4.897961,43.954018,-23.808758,-42.651337,-51.86827,-50.709732,-52.18156,37.734905,-15.853402,56.91643,-5.8815174,57.253094,-2.012879,54.157806,-4.9817176,44.384747,-23.902956,-42.830154,-52.10025,-50.96271,-52.3829,37.84573,-15.81032,57.177113,-5.958963,57.356136,-1.9952412,54.27533,-5.066312,44.878296,-23.956438,-42.993656,-52.337124,-51.208073,-52.615646,37.91102,-15.8062525,57.49891,-6.056076,57.45604,-1.9797823,54.39525,-5.1483474,45.374573],[88.028534,88.95315,89.87776,90.802376,91.64913,92.49588,93.342636,94.19737,95.0521,95.90684,96.712975,97.51912,98.32526,98.36342,98.40158,98.43974,98.36777,98.29579,98.223816,98.536446,98.849075,99.161705,99.7552,100.348694,100.94219,101.53184,102.12149,102.711136,103.79921,104.88729,105.975365,107.50462,109.033875,110.56313,111.79767,113.032196,114.26673,115.02128,115.775826,116.53037,117.15541,117.78044,118.40548,118.86489,119.3243,119.783714,120.04031,120.29691,120.55351,120.78621,121.01891,121.25161,121.533585,121.81555,122.09753,122.41821,122.7389,123.059586,123.39267],[-2.97538,2.8587952,-23.402771,0.91121674,4.8231735,9.141075,8.115662,10.785301,0.32717896,5.99382,-12.363731,5.29055,0.53089905,-2.3264008,-3.4524994,1.4582214,-2.321785,2.51297,5.4275208,3.3318253,5.8606567,0.019859314,-4.4901123,-12.495293,-5.8586197,-1.650322,-11.374588,4.3017426,4.042984,1.094429,9.639885,3.3983307,-3.20372,-5.462883,-5.834961,-6.649292,-1.1124649,3.7890396,16.047066,-2.5714111,8.488449,-2.785202,2.319191,-0.79857635,13.797401,-5.827278,-6.0466614,-5.9597855,-7.3454437,-3.1705627,6.0700684,3.5546417,1.9675064,-0.7594757,2.446434,0.5615692,0.86585236,-3.9112396,1.2327576]] +[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0],[10.1,20.449999,40.340004,10.100001,20.45,40.34,10.100001,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.100002,20.45,40.34]] +[[4.04452e-8,-1.7846537e-8,-5.9488454e-9,0,0,0,0,0,0,-1.9868216e-8,-9.5297715e-8,2.2540547e-9,3.4229203e-8,8.573613e-8],[1.9999999,2,2,2,2,2,2,2,2,2,2,2,1.9999996,1.9999996],[1.1920929e-7,0,0,0,0,0,0,0,0,0,0,0,3.5762787e-7,2.3841858e-7],[1.9999999,2,2,2,2,2,2,2,2,2,1.9999999,2,1.9999996,1.9999998]] 
+[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0],[10.1,20.449999,40.340004,10.100001,20.45,40.34,10.100001,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.100002,20.45,40.34]] +[[53.946846,-4.8119445,43.525013,-23.71359,-42.472305,-51.636955,-50.458298,-51.982674,37.62072,-15.9006605,56.65076,-5.809669,57.143845,-2.0370207,54.050922,-4.897961,43.954018,-23.808758,-42.651337,-51.86827,-50.709732,-52.18156,37.734905,-15.853402,56.91643,-5.8815174,57.253094,-2.012879,54.157806,-4.9817176,44.384747,-23.902956,-42.830154,-52.10025,-50.96271,-52.3829,37.84573,-15.81032,57.177113,-5.958963,57.356136,-1.9952412,54.27533,-5.066312,44.878296,-23.956438,-42.993656,-52.337124,-51.208073,-52.615646,37.91102,-15.8062525,57.49891,-6.056076,57.45604,-1.9797823,54.39525,-5.1483474,45.374573],[88.028534,88.95315,89.87776,90.802376,91.64913,92.49588,93.342636,94.19737,95.0521,95.90684,96.712975,97.51912,98.32526,98.36342,98.40158,98.43974,98.36777,98.29579,98.223816,98.536446,98.849075,99.161705,99.7552,100.348694,100.94219,101.53184,102.12149,102.711136,103.79921,104.88729,105.975365,107.50462,109.033875,110.56313,111.79767,113.032196,114.26673,115.02128,115.775826,116.53037,117.15541,117.78044,118.40548,118.86489,119.3243,119.783714,120.04031,120.29691,120.55351,120.78621,121.01891,121.25161,121.533585,121.81555,122.09753,122.41821,122.7389,123.059586,123.39267],[-2.97538,2.8587952,-23.402771,0.91121674,4.8231735,9.141075,8.115662,10.785301,0.32717896,5.99382,-12.363731,5.29055,0.53089905,-2.3264008,-3.4524994,1.4582214,-2.321785,2.51297,5.4275208,3.3318253,5.8606567,0.019859314,-4.4901123,-12.495293,-5.8586197,-1.650322,-11.374588,4.3017426,4.042984,1.094429,9.639885,3.3983307,-3.20372,-5.462883,-5.834961,-6.649292,-1.1124649,3.7890396,16.047066,-2.5714111,8.488449,-2.785202,2.319191,-0.79857635,13.797401,-5.827278,-6.0466614,-5.9597855,-7.3454437,-3.1705627,6.0700684,3.5546417,1.9675064,-0.7594757,2.446434,0.5615692,0.86585236,-3.9112396,1.2327576],[141.97537,84.141205,133.40277,67.08878,49.176826,40.858925,42.88434,42.2147,132.67282,80.00618,153.36374,91.70945,155.4691,96.3264,152.4525,93.54178,142.32178,74.48703,55.57248,46.668175,48.139343,46.980145,137.49011,84.49529,157.85863,95.65032,159.37459,100.69826,157.95702,99.90557,150.3601,83.60167,66.20372,58.462883,60.834957,60.649296,152.11246,99.21096,172.95294,110.57141,174.51155,115.7852,172.68082,113.79858,164.2026,95.82728,77.04666,67.95979,69.34544,68.17056,158.92993,105.44536,179.0325,115.759476,179.55356,120.43843,177.13416,117.91124,168.76724]] From f935493f284e1acd94eacdf0c50f91de688d817e Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Fri, 19 Jan 2024 09:05:04 -0800 Subject: [PATCH 082/245] fix trailing whitespaces --- docs/en/sql-reference/functions/time-series-functions.md | 2 +- src/Functions/seriesDecomposeSTL.cpp | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 
2e42aa884b4..21e66302ad2 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -78,7 +78,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** - An array of four arrays where the first array include seasonal components, the second array - trend, -the third array - residue component, and the fourth array - baseline component. +the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. Type: [Array](../../sql-reference/data-types/array.md). diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 0c44afa32a6..9a6a229e282 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -128,7 +128,7 @@ public: res_data.insert(residue.begin(), residue.end()); res_col_offsets_data.push_back(res_data.size()); - // Create Baseline = seasonal + trend + // Create Baseline = seasonal + trend std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); res_col_offsets_data.push_back(res_data.size()); @@ -205,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline component. +- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. Type: [Array](../../sql-reference/data-types/array.md). From d9edd5a7f36491a8d86705e6c7221c1a74cd6ef5 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Fri, 19 Jan 2024 10:20:01 -0800 Subject: [PATCH 083/245] fix spell check --- docs/en/sql-reference/functions/time-series-functions.md | 2 +- src/Functions/seriesDecomposeSTL.cpp | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 21e66302ad2..016c3410944 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -78,7 +78,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** - An array of four arrays where the first array include seasonal components, the second array - trend, -the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. +the third array - residue component, and the fourth array - baseline(seasonal + trend) component. Type: [Array](../../sql-reference/data-types/array.md). diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 9a6a229e282..4376691868b 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -205,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. 
+- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasonal + trend) component. Type: [Array](../../sql-reference/data-types/array.md). From 084ee74b6898214024feafcfa292ff8419bc0050 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Mon, 22 Jan 2024 07:31:33 -0800 Subject: [PATCH 084/245] minor fix --- src/Functions/seriesDecomposeSTL.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 4376691868b..e9276c4aefb 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -129,7 +129,7 @@ public: res_col_offsets_data.push_back(res_data.size()); // Create Baseline = seasonal + trend - std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); + std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus<>()); res_col_offsets_data.push_back(res_data.size()); root_offsets_data.push_back(res_col_offsets->size()); From 78df07199bc57c8dac9a56fb8092eb1256ad8b56 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Tue, 23 Jan 2024 07:16:38 +0000 Subject: [PATCH 085/245] More consistent tests for inverted index --- ...> 02346_inverted_index_bug47393.reference} | 0 .../02346_inverted_index_bug47393.sql | 25 +++++++++++++++++++ ...> 02346_inverted_index_bug52019.reference} | 0 ....sql => 02346_inverted_index_bug52019.sql} | 17 ++++++++++--- ...46_inverted_index_detach_attach.reference} | 0 ...=> 02346_inverted_index_detach_attach.sql} | 6 ++--- ...nverted_index_experimental_flag.reference} | 0 ...2346_inverted_index_experimental_flag.sql} | 3 +++ ..._inverted_index_match_predicate.reference} | 0 ... 02346_inverted_index_match_predicate.sql} | 2 ++ .../02346_inverted_index_mutation.sql | 25 ------------------- ... 
=> 02346_inverted_index_search.reference} | 0 ...ch.sql => 02346_inverted_index_search.sql} | 0 13 files changed, 47 insertions(+), 31 deletions(-) rename tests/queries/0_stateless/{02346_inverted_index_mutation.reference => 02346_inverted_index_bug47393.reference} (100%) create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug47393.sql rename tests/queries/0_stateless/{02696_inverted_idx_checksums.reference => 02346_inverted_index_bug52019.reference} (100%) rename tests/queries/0_stateless/{02862_index_inverted_incorrect_args.sql => 02346_inverted_index_bug52019.sql} (62%) rename tests/queries/0_stateless/{02862_index_inverted_incorrect_args.reference => 02346_inverted_index_detach_attach.reference} (100%) rename tests/queries/0_stateless/{02696_inverted_idx_checksums.sql => 02346_inverted_index_detach_attach.sql} (75%) rename tests/queries/0_stateless/{02895_forbid_create_inverted_index.reference => 02346_inverted_index_experimental_flag.reference} (100%) rename tests/queries/0_stateless/{02895_forbid_create_inverted_index.sql => 02346_inverted_index_experimental_flag.sql} (72%) rename tests/queries/0_stateless/{02951_inverted_index_support_match.reference => 02346_inverted_index_match_predicate.reference} (100%) rename tests/queries/0_stateless/{02951_inverted_index_support_match.sql => 02346_inverted_index_match_predicate.sql} (97%) delete mode 100644 tests/queries/0_stateless/02346_inverted_index_mutation.sql rename tests/queries/0_stateless/{02346_full_text_search.reference => 02346_inverted_index_search.reference} (100%) rename tests/queries/0_stateless/{02346_full_text_search.sql => 02346_inverted_index_search.sql} (100%) diff --git a/tests/queries/0_stateless/02346_inverted_index_mutation.reference b/tests/queries/0_stateless/02346_inverted_index_bug47393.reference similarity index 100% rename from tests/queries/0_stateless/02346_inverted_index_mutation.reference rename to tests/queries/0_stateless/02346_inverted_index_bug47393.reference diff --git a/tests/queries/0_stateless/02346_inverted_index_bug47393.sql b/tests/queries/0_stateless/02346_inverted_index_bug47393.sql new file mode 100644 index 00000000000..166e051b120 --- /dev/null +++ b/tests/queries/0_stateless/02346_inverted_index_bug47393.sql @@ -0,0 +1,25 @@ +SET allow_experimental_inverted_index = 1; + +DROP TABLE IF EXISTS tab; +CREATE TABLE tab +( + id UInt64, + str String, + INDEX idx str TYPE inverted(3) GRANULARITY 1 +) +ENGINE = MergeTree +ORDER BY tuple() +SETTINGS min_rows_for_wide_part = 1, min_bytes_for_wide_part = 1; + +INSERT INTO tab (str) VALUES ('I am inverted'); + +SELECT data_version FROM system.parts WHERE database = currentDatabase() AND table = 'tab' AND active = 1; + +-- update column synchronously +ALTER TABLE tab UPDATE str = 'I am not inverted' WHERE 1 SETTINGS mutations_sync=1; + +SELECT data_version FROM system.parts WHERE database = currentDatabase() AND table = 'tab' AND active = 1; + +SELECT str FROM tab WHERE str LIKE '%inverted%' SETTINGS force_data_skipping_indices = 'idx'; + +DROP TABLE tab; diff --git a/tests/queries/0_stateless/02696_inverted_idx_checksums.reference b/tests/queries/0_stateless/02346_inverted_index_bug52019.reference similarity index 100% rename from tests/queries/0_stateless/02696_inverted_idx_checksums.reference rename to tests/queries/0_stateless/02346_inverted_index_bug52019.reference diff --git a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql b/tests/queries/0_stateless/02346_inverted_index_bug52019.sql similarity index 62% rename from 
tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql rename to tests/queries/0_stateless/02346_inverted_index_bug52019.sql index 7ba122a7155..c61e17d9cea 100644 --- a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql +++ b/tests/queries/0_stateless/02346_inverted_index_bug52019.sql @@ -1,9 +1,20 @@ --- https://github.com/ClickHouse/ClickHouse/issues/52019 -DROP TABLE IF EXISTS tab; +-- Test for Bug 52019: Undefined behavior + SET allow_experimental_inverted_index=1; -CREATE TABLE tab (`k` UInt64, `s` Map(String, String), INDEX af mapKeys(s) TYPE inverted(2) GRANULARITY 1) ENGINE = MergeTree ORDER BY k SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi'; + +DROP TABLE IF EXISTS tab; + +CREATE TABLE tab ( + k UInt64, + s Map(String, String), + INDEX idx mapKeys(s) TYPE inverted(2) GRANULARITY 1) +ENGINE = MergeTree +ORDER BY k +SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi'; + INSERT INTO tab (k) VALUES (0); SELECT * FROM tab PREWHERE (s[NULL]) = 'Click a03' SETTINGS allow_experimental_analyzer=1; SELECT * FROM tab PREWHERE (s[1]) = 'Click a03' SETTINGS allow_experimental_analyzer=1; -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT * FROM tab PREWHERE (s['foo']) = 'Click a03' SETTINGS allow_experimental_analyzer=1; + DROP TABLE tab; diff --git a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.reference b/tests/queries/0_stateless/02346_inverted_index_detach_attach.reference similarity index 100% rename from tests/queries/0_stateless/02862_index_inverted_incorrect_args.reference rename to tests/queries/0_stateless/02346_inverted_index_detach_attach.reference diff --git a/tests/queries/0_stateless/02696_inverted_idx_checksums.sql b/tests/queries/0_stateless/02346_inverted_index_detach_attach.sql similarity index 75% rename from tests/queries/0_stateless/02696_inverted_idx_checksums.sql rename to tests/queries/0_stateless/02346_inverted_index_detach_attach.sql index 92ffa7a6196..762d78922fe 100644 --- a/tests/queries/0_stateless/02696_inverted_idx_checksums.sql +++ b/tests/queries/0_stateless/02346_inverted_index_detach_attach.sql @@ -2,8 +2,8 @@ SET allow_experimental_inverted_index = 1; CREATE TABLE t ( - `key` UInt64, - `str` String, + key UInt64, + str String, INDEX inv_idx str TYPE inverted(0) GRANULARITY 1 ) ENGINE = MergeTree @@ -13,4 +13,4 @@ INSERT INTO t VALUES (1, 'Hello World'); ALTER TABLE t DETACH PART 'all_1_1_0'; -ALTER TABLE t ATTACH PART 'all_1_1_0'; \ No newline at end of file +ALTER TABLE t ATTACH PART 'all_1_1_0'; diff --git a/tests/queries/0_stateless/02895_forbid_create_inverted_index.reference b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.reference similarity index 100% rename from tests/queries/0_stateless/02895_forbid_create_inverted_index.reference rename to tests/queries/0_stateless/02346_inverted_index_experimental_flag.reference diff --git a/tests/queries/0_stateless/02895_forbid_create_inverted_index.sql b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql similarity index 72% rename from tests/queries/0_stateless/02895_forbid_create_inverted_index.sql rename to tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql index dc92d9198fb..bf89265372e 100644 --- a/tests/queries/0_stateless/02895_forbid_create_inverted_index.sql +++ b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql @@ -1,4 +1,7 @@ +-- Tests that the inverted index can only be supported when allow_experimental_inverted_index = 1. 
+ SET allow_experimental_inverted_index = 0; + DROP TABLE IF EXISTS tab; CREATE TABLE tab ( diff --git a/tests/queries/0_stateless/02951_inverted_index_support_match.reference b/tests/queries/0_stateless/02346_inverted_index_match_predicate.reference similarity index 100% rename from tests/queries/0_stateless/02951_inverted_index_support_match.reference rename to tests/queries/0_stateless/02346_inverted_index_match_predicate.reference diff --git a/tests/queries/0_stateless/02951_inverted_index_support_match.sql b/tests/queries/0_stateless/02346_inverted_index_match_predicate.sql similarity index 97% rename from tests/queries/0_stateless/02951_inverted_index_support_match.sql rename to tests/queries/0_stateless/02346_inverted_index_match_predicate.sql index 9ebf10412d9..99405c0acf2 100644 --- a/tests/queries/0_stateless/02951_inverted_index_support_match.sql +++ b/tests/queries/0_stateless/02346_inverted_index_match_predicate.sql @@ -1,3 +1,5 @@ +-- Tests that match() utilizes the inverted index + SET allow_experimental_inverted_index = true; DROP TABLE IF EXISTS tab; diff --git a/tests/queries/0_stateless/02346_inverted_index_mutation.sql b/tests/queries/0_stateless/02346_inverted_index_mutation.sql deleted file mode 100644 index 83b73807cd7..00000000000 --- a/tests/queries/0_stateless/02346_inverted_index_mutation.sql +++ /dev/null @@ -1,25 +0,0 @@ -SET allow_experimental_inverted_index=1; - -DROP TABLE IF EXISTS t; -CREATE TABLE t -( - `timestamp` UInt64, - `s` String, - INDEX idx s TYPE inverted(3) GRANULARITY 1 -) -ENGINE = MergeTree -ORDER BY tuple() -SETTINGS min_rows_for_wide_part = 1, min_bytes_for_wide_part = 1; - -INSERT INTO t (s) VALUES ('I am inverted'); - -SELECT data_version FROM system.parts WHERE database=currentDatabase() AND table='t' AND active=1; - --- do update column synchronously -ALTER TABLE t UPDATE s='I am not inverted' WHERE 1 SETTINGS mutations_sync=1; - -SELECT data_version FROM system.parts WHERE database=currentDatabase() AND table='t' AND active=1; - -SELECT s FROM t WHERE s LIKE '%inverted%' SETTINGS force_data_skipping_indices='idx'; - -DROP TABLE t; diff --git a/tests/queries/0_stateless/02346_full_text_search.reference b/tests/queries/0_stateless/02346_inverted_index_search.reference similarity index 100% rename from tests/queries/0_stateless/02346_full_text_search.reference rename to tests/queries/0_stateless/02346_inverted_index_search.reference diff --git a/tests/queries/0_stateless/02346_full_text_search.sql b/tests/queries/0_stateless/02346_inverted_index_search.sql similarity index 100% rename from tests/queries/0_stateless/02346_full_text_search.sql rename to tests/queries/0_stateless/02346_inverted_index_search.sql From bfec324b2818a3764c09347508125051273dac25 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Tue, 23 Jan 2024 10:06:25 +0000 Subject: [PATCH 086/245] Some fixups + test --- src/Storages/MergeTree/MutateTask.cpp | 18 ++++++++++------- .../02346_inverted_index_bug59039.reference | 0 .../02346_inverted_index_bug59039.sql | 20 +++++++++++++++++++ 3 files changed, 31 insertions(+), 7 deletions(-) create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug59039.reference create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug59039.sql diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index fccee6bd887..48aad368dd4 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -674,21 +674,25 @@ static NameToNameVector 
collectFilesForRenames(
 {
     if (command.type == MutationCommand::Type::DROP_INDEX)
     {
-        const std::vector<String> suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"};
+        static const std::array<String, 2> suffixes = {".idx2", ".idx"};
+        static const std::array<String, 4> gin_suffixes = {".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; /// .gin_* is inverted index
 
         for (const auto & suffix : suffixes)
         {
-            String filename = INDEX_FILE_PREFIX + command.column_name + suffix;
+            const String filename = INDEX_FILE_PREFIX + command.column_name + suffix;
+            const String filename_mrk = INDEX_FILE_PREFIX + command.column_name + mrk_extension;
 
-            if ((suffix == ".idx2" || suffix == ".idx") && source_part->checksums.has(filename))
+            if (source_part->checksums.has(filename))
             {
                 add_rename(filename, "");
-                add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, "");
+                add_rename(filename_mrk, "");
             }
-            else if (source_part->checksums.has(filename))
-            {
+        }
+        for (const auto & gin_suffix : gin_suffixes)
+        {
+            const String filename = INDEX_FILE_PREFIX + command.column_name + gin_suffix;
+            if (source_part->checksums.has(filename))
                 add_rename(filename, "");
-            }
         }
     }
     else if (command.type == MutationCommand::Type::DROP_PROJECTION)

diff --git a/tests/queries/0_stateless/02346_inverted_index_bug59039.reference b/tests/queries/0_stateless/02346_inverted_index_bug59039.reference
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/tests/queries/0_stateless/02346_inverted_index_bug59039.sql b/tests/queries/0_stateless/02346_inverted_index_bug59039.sql
new file mode 100644
index 00000000000..0ef0cb0c733
--- /dev/null
+++ b/tests/queries/0_stateless/02346_inverted_index_bug59039.sql
@@ -0,0 +1,20 @@
+-- This is supposed to test that DROP INDEX removes all index related files. Can't test this directly but at least run the statement and
+-- check that no bad things happen.
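The split into `suffixes` and `gin_suffixes` reflects the on-disk layout: only the `.idx`/`.idx2` skip-index files have an accompanying mark file to rename, while the four `.gin_*` files of an inverted index stand alone. A hedged metadata-level companion check, kept outside the new test (table name illustrative):

```sql
SET allow_experimental_inverted_index = 1;

DROP TABLE IF EXISTS tab_drop;
CREATE TABLE tab_drop (id UInt64, doc String, INDEX text_idx doc TYPE inverted)
ENGINE = MergeTree ORDER BY id;

INSERT INTO tab_drop VALUES (1, 'a b c');

ALTER TABLE tab_drop DROP INDEX text_idx;

-- Expected: zero rows; the DROP INDEX mutation is what renames the
-- .gin_* files away on disk.
SELECT name FROM system.data_skipping_indices
WHERE database = currentDatabase() AND table = 'tab_drop';
```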
+ +SET allow_experimental_inverted_index = 1; + +DROP TABLE IF EXISTS tab; + +CREATE TABLE tab +( + id UInt64, + doc String, + INDEX text_idx doc TYPE inverted +) +ENGINE = MergeTree +ORDER BY id +SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi', min_bytes_for_wide_part = 0, min_rows_for_wide_part = 0; + +ALTER TABLE tab DROP INDEX text_idx; + +DROP TABLE tab; From bef0fcb482c4b8782a1d2e485be9f6d8ffc2dfe9 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 23 Jan 2024 14:56:24 +0100 Subject: [PATCH 087/245] Fix is_order_by_all flag in QueryNode --- src/Analyzer/QueryNode.cpp | 28 +++++++++++++++++----------- 1 file changed, 17 insertions(+), 11 deletions(-) diff --git a/src/Analyzer/QueryNode.cpp b/src/Analyzer/QueryNode.cpp index 738b1ac62e8..a82fb4489b5 100644 --- a/src/Analyzer/QueryNode.cpp +++ b/src/Analyzer/QueryNode.cpp @@ -119,6 +119,9 @@ void QueryNode::dumpTreeImpl(WriteBuffer & buffer, FormatState & format_state, s if (is_group_by_all) buffer << ", is_group_by_all: " << is_group_by_all; + if (is_order_by_all) + buffer << ", is_order_by_all: " << is_order_by_all; + std::string group_by_type; if (is_group_by_with_rollup) group_by_type = "rollup"; @@ -257,6 +260,7 @@ bool QueryNode::isEqualImpl(const IQueryTreeNode & rhs) const is_group_by_with_cube == rhs_typed.is_group_by_with_cube && is_group_by_with_grouping_sets == rhs_typed.is_group_by_with_grouping_sets && is_group_by_all == rhs_typed.is_group_by_all && + is_order_by_all == rhs_typed.is_order_by_all && cte_name == rhs_typed.cte_name && projection_columns == rhs_typed.projection_columns && settings_changes == rhs_typed.settings_changes; @@ -288,6 +292,7 @@ void QueryNode::updateTreeHashImpl(HashState & state) const state.update(is_group_by_with_cube); state.update(is_group_by_with_grouping_sets); state.update(is_group_by_all); + state.update(is_order_by_all); state.update(settings_changes.size()); @@ -306,18 +311,19 @@ QueryTreeNodePtr QueryNode::cloneImpl() const { auto result_query_node = std::make_shared(context); - result_query_node->is_subquery = is_subquery; - result_query_node->is_cte = is_cte; - result_query_node->is_distinct = is_distinct; - result_query_node->is_limit_with_ties = is_limit_with_ties; - result_query_node->is_group_by_with_totals = is_group_by_with_totals; - result_query_node->is_group_by_with_rollup = is_group_by_with_rollup; - result_query_node->is_group_by_with_cube = is_group_by_with_cube; + result_query_node->is_subquery = is_subquery; + result_query_node->is_cte = is_cte; + result_query_node->is_distinct = is_distinct; + result_query_node->is_limit_with_ties = is_limit_with_ties; + result_query_node->is_group_by_with_totals = is_group_by_with_totals; + result_query_node->is_group_by_with_rollup = is_group_by_with_rollup; + result_query_node->is_group_by_with_cube = is_group_by_with_cube; result_query_node->is_group_by_with_grouping_sets = is_group_by_with_grouping_sets; - result_query_node->is_group_by_all = is_group_by_all; - result_query_node->cte_name = cte_name; - result_query_node->projection_columns = projection_columns; - result_query_node->settings_changes = settings_changes; + result_query_node->is_group_by_all = is_group_by_all; + result_query_node->is_order_by_all = is_order_by_all; + result_query_node->cte_name = cte_name; + result_query_node->projection_columns = projection_columns; + result_query_node->settings_changes = settings_changes; return result_query_node; } From 799a94081ba7587ec47d85554bdbb458ffb1436d Mon Sep 17 00:00:00 2001 From: Arthur Passos Date: 
Tue, 23 Jan 2024 11:40:42 -0300 Subject: [PATCH 088/245] Revert "Revert "Allow to attach partition from table with different partition expression when destination partition expression doesn't re-partition"" This reverts commit a1c83e2f51117a69d484c7ae7884c3bc5dd98129. --- .../statements/alter/partition.md | 2 +- src/Interpreters/MonotonicityCheckVisitor.h | 102 +++- src/Interpreters/applyFunction.cpp | 43 ++ src/Interpreters/applyFunction.h | 16 + src/Parsers/queryToString.cpp | 5 + src/Parsers/queryToString.h | 1 + src/Storages/MergeTree/IMergeTreeDataPart.cpp | 37 +- src/Storages/MergeTree/IMergeTreeDataPart.h | 1 + src/Storages/MergeTree/KeyCondition.cpp | 83 +-- src/Storages/MergeTree/MergeTreeData.cpp | 350 +++++-------- src/Storages/MergeTree/MergeTreeData.h | 18 + .../MergeTree/MergeTreeDataPartCloner.cpp | 320 ++++++++++++ .../MergeTree/MergeTreeDataPartCloner.h | 43 ++ src/Storages/MergeTree/MergeTreePartition.cpp | 39 ++ src/Storages/MergeTree/MergeTreePartition.h | 10 +- ...ergeTreePartitionCompatibilityVerifier.cpp | 91 ++++ .../MergeTreePartitionCompatibilityVerifier.h | 30 ++ ...TreePartitionGlobalMinMaxIdxCalculator.cpp | 25 + ...geTreePartitionGlobalMinMaxIdxCalculator.h | 24 + src/Storages/StorageMergeTree.cpp | 93 +++- src/Storages/StorageReplicatedMergeTree.cpp | 135 ++++- .../__init__.py | 0 .../configs/remote_servers.xml | 17 + .../test.py | 214 ++++++++ ...artition_different_partition_exp.reference | 467 +++++++++++++++++ ...tach_partition_different_partition_exp.sql | 485 ++++++++++++++++++ 26 files changed, 2310 insertions(+), 341 deletions(-) create mode 100644 src/Interpreters/applyFunction.cpp create mode 100644 src/Interpreters/applyFunction.h create mode 100644 src/Storages/MergeTree/MergeTreeDataPartCloner.cpp create mode 100644 src/Storages/MergeTree/MergeTreeDataPartCloner.h create mode 100644 src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp create mode 100644 src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h create mode 100644 src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp create mode 100644 src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/test.py create mode 100644 tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference create mode 100644 tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql diff --git a/docs/en/sql-reference/statements/alter/partition.md b/docs/en/sql-reference/statements/alter/partition.md index 114b8d5ffe3..5659a0565c5 100644 --- a/docs/en/sql-reference/statements/alter/partition.md +++ b/docs/en/sql-reference/statements/alter/partition.md @@ -112,7 +112,7 @@ Note that: For the query to run successfully, the following conditions must be met: - Both tables must have the same structure. -- Both tables must have the same partition key, the same order by key and the same primary key. +- Both tables must have the same order by key and the same primary key. - Both tables must have the same indices and projections. - Both tables must have the same storage policy. 
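In concrete terms, the relaxed conditions make an attach like the following legal, provided every column used by the destination's partition expression is also used by the source's and no single source part would need to be split across destination partitions. A sketch (schemas illustrative):

```sql
CREATE TABLE src (ts DateTime, key Int64, value String)
ENGINE = MergeTree PARTITION BY toYYYYMMDD(ts) ORDER BY key;

CREATE TABLE dst (ts DateTime, key Int64, value String)
ENGINE = MergeTree PARTITION BY toYYYYMM(ts) ORDER BY key;

INSERT INTO src VALUES ('2024-01-02 10:00:00', 1, 'a'), ('2024-01-02 11:00:00', 2, 'b');

-- The partition literal is resolved against the source table's expression;
-- the cloned part is then stamped with dst's own partition id (202401).
ALTER TABLE dst ATTACH PARTITION 20240102 FROM src;

SELECT partition, name FROM system.parts
WHERE database = currentDatabase() AND table = 'dst' AND active;
```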
diff --git a/src/Interpreters/MonotonicityCheckVisitor.h b/src/Interpreters/MonotonicityCheckVisitor.h index cc386825024..4e71bd56851 100644 --- a/src/Interpreters/MonotonicityCheckVisitor.h +++ b/src/Interpreters/MonotonicityCheckVisitor.h @@ -1,13 +1,17 @@ #pragma once #include +#include #include +#include #include #include -#include #include +#include +#include #include #include +#include #include #include #include @@ -33,6 +37,8 @@ public: ASTIdentifier * identifier = nullptr; DataTypePtr arg_data_type = {}; + Range range = Range::createWholeUniverse(); + void reject() { monotonicity.is_monotonic = false; } bool isRejected() const { return !monotonicity.is_monotonic; } @@ -97,13 +103,30 @@ public: if (data.isRejected()) return; - /// TODO: monotonicity for functions of several arguments - if (!ast_function.arguments || ast_function.arguments->children.size() != 1) + /// Monotonicity check only works for functions that contain at most two arguments and one of them must be a constant. + if (!ast_function.arguments) { data.reject(); return; } + auto arguments_size = ast_function.arguments->children.size(); + + if (arguments_size == 0 || arguments_size > 2) + { + data.reject(); + return; + } + else if (arguments_size == 2) + { + /// If the function has two arguments, then one of them must be a constant. + if (!ast_function.arguments->children[0]->as() && !ast_function.arguments->children[1]->as()) + { + data.reject(); + return; + } + } + if (!data.canOptimize(ast_function)) { data.reject(); @@ -124,14 +147,33 @@ public: return; } - ColumnsWithTypeAndName args; - args.emplace_back(data.arg_data_type, "tmp"); - auto function_base = function->build(args); + auto function_arguments = getFunctionArguments(ast_function, data); + + auto function_base = function->build(function_arguments); if (function_base && function_base->hasInformationAboutMonotonicity()) { bool is_positive = data.monotonicity.is_positive; - data.monotonicity = function_base->getMonotonicityForRange(*data.arg_data_type, Field(), Field()); + data.monotonicity = function_base->getMonotonicityForRange(*data.arg_data_type, data.range.left, data.range.right); + + auto & key_range = data.range; + + /// If we apply function to open interval, we can get empty intervals in result. + /// E.g. for ('2020-01-03', '2020-01-20') after applying 'toYYYYMM' we will get ('202001', '202001'). + /// To avoid this we make range left and right included. + /// Any function that treats NULL specially is not monotonic. + /// Thus we can safely use isNull() as an -Inf/+Inf indicator here. + if (!key_range.left.isNull()) + { + key_range.left = applyFunction(function_base, data.arg_data_type, key_range.left); + key_range.left_included = true; + } + + if (!key_range.right.isNull()) + { + key_range.right = applyFunction(function_base, data.arg_data_type, key_range.right); + key_range.right_included = true; + } if (!is_positive) data.monotonicity.is_positive = !data.monotonicity.is_positive; @@ -143,13 +185,53 @@ public: static bool needChildVisit(const ASTPtr & parent, const ASTPtr &) { - /// Currently we check monotonicity only for single-argument functions. - /// Although, multi-argument functions with all but one constant arguments can also be monotonic. + /// Multi-argument functions with all but one constant arguments can be monotonic. 
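In user-visible terms, this visitor backs the classic analyzer's `optimize_monotonous_functions_in_order_by` pass, so after this change a two-argument monotonic function with one constant argument can also be stripped from ORDER BY. A sketch under that assumption:

```sql
SET optimize_monotonous_functions_in_order_by = 1;

CREATE TABLE events (d Date, x UInt64) ENGINE = MergeTree ORDER BY d;
INSERT INTO events SELECT toDate('2024-01-01') + number, number FROM numbers(100);

-- `d + 42` is monotonic in `d` when the second argument is constant, so the
-- rewritten query should sort by plain `d` and read in primary-key order.
EXPLAIN SYNTAX SELECT * FROM events ORDER BY d + 42;
```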
if (const auto * func = typeid_cast<const ASTFunction *>(parent.get()))
-            return func->arguments->children.size() < 2;
+            return func->arguments->children.size() <= 2;
 
         return true;
     }
+
+    static ColumnWithTypeAndName extractLiteralColumnAndTypeFromAstLiteral(const ASTLiteral * literal)
+    {
+        ColumnWithTypeAndName result;
+
+        result.type = applyVisitor(FieldToDataType(), literal->value);
+        result.column = result.type->createColumnConst(0, literal->value);
+
+        return result;
+    }
+
+    static ColumnsWithTypeAndName getFunctionArguments(const ASTFunction & ast_function, const Data & data)
+    {
+        ColumnsWithTypeAndName args;
+
+        auto arguments_size = ast_function.arguments->children.size();
+
+        chassert(arguments_size == 1 || arguments_size == 2);
+
+        if (arguments_size == 2)
+        {
+            if (ast_function.arguments->children[0]->as<ASTLiteral>())
+            {
+                const auto * literal = ast_function.arguments->children[0]->as<ASTLiteral>();
+                args.push_back(extractLiteralColumnAndTypeFromAstLiteral(literal));
+                args.emplace_back(data.arg_data_type, "tmp");
+            }
+            else
+            {
+                const auto * literal = ast_function.arguments->children[1]->as<ASTLiteral>();
+                args.emplace_back(data.arg_data_type, "tmp");
+                args.push_back(extractLiteralColumnAndTypeFromAstLiteral(literal));
+            }
+        }
+        else
+        {
+            args.emplace_back(data.arg_data_type, "tmp");
+        }
+
+        return args;
+    }
 };
 
 using MonotonicityCheckVisitor = ConstInDepthNodeVisitor<MonotonicityCheckMatcher, false>;

diff --git a/src/Interpreters/applyFunction.cpp b/src/Interpreters/applyFunction.cpp
new file mode 100644
index 00000000000..a53f14f0381
--- /dev/null
+++ b/src/Interpreters/applyFunction.cpp
@@ -0,0 +1,43 @@
+#include <Interpreters/applyFunction.h>
+
+#include <Core/Range.h>
+#include <Functions/IFunction.h>
+
+namespace DB
+{
+
+static Field applyFunctionForField(const FunctionBasePtr & func, const DataTypePtr & arg_type, const Field & arg_value)
+{
+    ColumnsWithTypeAndName columns{
+        {arg_type->createColumnConst(1, arg_value), arg_type, "x"},
+    };
+
+    auto col = func->execute(columns, func->getResultType(), 1);
+    return (*col)[0];
+}
+
+FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field)
+{
+    /// Fallback for fields without block reference.
+ if (field.isExplicit()) + return applyFunctionForField(func, current_type, field); + + String result_name = "_" + func->getName() + "_" + toString(field.column_idx); + const auto & columns = field.columns; + size_t result_idx = columns->size(); + + for (size_t i = 0; i < result_idx; ++i) + if ((*columns)[i].name == result_name) + result_idx = i; + + if (result_idx == columns->size()) + { + ColumnsWithTypeAndName args{(*columns)[field.column_idx]}; + field.columns->emplace_back(ColumnWithTypeAndName{nullptr, func->getResultType(), result_name}); + (*columns)[result_idx].column = func->execute(args, (*columns)[result_idx].type, columns->front().column->size()); + } + + return {field.columns, field.row_idx, result_idx}; +} + +} diff --git a/src/Interpreters/applyFunction.h b/src/Interpreters/applyFunction.h new file mode 100644 index 00000000000..9b8ae43a53c --- /dev/null +++ b/src/Interpreters/applyFunction.h @@ -0,0 +1,16 @@ +#pragma once + +#include + +namespace DB +{ +struct FieldRef; + +class IFunctionBase; +class IDataType; + +using DataTypePtr = std::shared_ptr; +using FunctionBasePtr = std::shared_ptr; + +FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field); +} diff --git a/src/Parsers/queryToString.cpp b/src/Parsers/queryToString.cpp index 9721aa1f128..4a1903393f6 100644 --- a/src/Parsers/queryToString.cpp +++ b/src/Parsers/queryToString.cpp @@ -3,6 +3,11 @@ namespace DB { + String queryToStringNullable(const ASTPtr & query) + { + return query ? queryToString(query) : ""; + } + String queryToString(const ASTPtr & query) { return queryToString(*query); diff --git a/src/Parsers/queryToString.h b/src/Parsers/queryToString.h index 873de218293..3acd560b1e2 100644 --- a/src/Parsers/queryToString.h +++ b/src/Parsers/queryToString.h @@ -6,4 +6,5 @@ namespace DB { String queryToString(const ASTPtr & query); String queryToString(const IAST & query); + String queryToStringNullable(const ASTPtr & query); } diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 87f23b0da2a..f3057a8254f 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -81,6 +81,7 @@ void IMergeTreeDataPart::MinMaxIndex::load(const MergeTreeData & data, const Par auto minmax_column_types = data.getMinMaxColumnsTypes(partition_key); size_t minmax_idx_size = minmax_column_types.size(); + hyperrectangle.clear(); hyperrectangle.reserve(minmax_idx_size); for (size_t i = 0; i < minmax_idx_size; ++i) { @@ -104,6 +105,39 @@ void IMergeTreeDataPart::MinMaxIndex::load(const MergeTreeData & data, const Par initialized = true; } +Block IMergeTreeDataPart::MinMaxIndex::getBlock(const MergeTreeData & data) const +{ + if (!initialized) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Attempt to get block from uninitialized MinMax index."); + + Block block; + + const auto metadata_snapshot = data.getInMemoryMetadataPtr(); + const auto & partition_key = metadata_snapshot->getPartitionKey(); + + const auto minmax_column_names = data.getMinMaxColumnsNames(partition_key); + const auto minmax_column_types = data.getMinMaxColumnsTypes(partition_key); + const auto minmax_idx_size = minmax_column_types.size(); + + for (size_t i = 0; i < minmax_idx_size; ++i) + { + const auto & data_type = minmax_column_types[i]; + const auto & column_name = minmax_column_names[i]; + + const auto column = data_type->createColumn(); + + const auto min_val = hyperrectangle.at(i).left; + const auto 
max_val = hyperrectangle.at(i).right; + + column->insert(min_val); + column->insert(max_val); + + block.insert(ColumnWithTypeAndName(column->getPtr(), data_type, column_name)); + } + + return block; +} + IMergeTreeDataPart::MinMaxIndex::WrittenFiles IMergeTreeDataPart::MinMaxIndex::store( const MergeTreeData & data, IDataPartStorage & part_storage, Checksums & out_checksums) const { @@ -185,8 +219,7 @@ void IMergeTreeDataPart::MinMaxIndex::merge(const MinMaxIndex & other) if (!initialized) { - hyperrectangle = other.hyperrectangle; - initialized = true; + *this = other; } else { diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 640a1f1d0a3..29f0f54d419 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -336,6 +336,7 @@ public: } void load(const MergeTreeData & data, const PartMetadataManagerPtr & manager); + Block getBlock(const MergeTreeData & data) const; using WrittenFiles = std::vector>; diff --git a/src/Storages/MergeTree/KeyCondition.cpp b/src/Storages/MergeTree/KeyCondition.cpp index d5922ae1bc2..e5bcb11091f 100644 --- a/src/Storages/MergeTree/KeyCondition.cpp +++ b/src/Storages/MergeTree/KeyCondition.cpp @@ -1,36 +1,37 @@ -#include -#include -#include +#include +#include #include #include #include #include +#include #include -#include #include -#include -#include -#include -#include -#include -#include -#include +#include #include +#include #include -#include -#include -#include -#include -#include -#include +#include +#include +#include +#include +#include #include -#include +#include +#include +#include +#include +#include #include #include #include -#include -#include +#include +#include +#include #include +#include +#include +#include #include #include @@ -836,21 +837,6 @@ bool KeyCondition::getConstant(const ASTPtr & expr, Block & block_with_constants return node.tryGetConstant(out_value, out_type); } - -static Field applyFunctionForField( - const FunctionBasePtr & func, - const DataTypePtr & arg_type, - const Field & arg_value) -{ - ColumnsWithTypeAndName columns - { - { arg_type->createColumnConst(1, arg_value), arg_type, "x" }, - }; - - auto col = func->execute(columns, func->getResultType(), 1); - return (*col)[0]; -} - /// The case when arguments may have types different than in the primary key. static std::pair applyFunctionForFieldOfUnknownType( const FunctionBasePtr & func, @@ -890,33 +876,6 @@ static std::pair applyBinaryFunctionForFieldOfUnknownType( return {std::move(result), std::move(return_type)}; } - -static FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field) -{ - /// Fallback for fields without block reference. 
- if (field.isExplicit()) - return applyFunctionForField(func, current_type, field); - - String result_name = "_" + func->getName() + "_" + toString(field.column_idx); - const auto & columns = field.columns; - size_t result_idx = columns->size(); - - for (size_t i = 0; i < result_idx; ++i) - { - if ((*columns)[i].name == result_name) - result_idx = i; - } - - if (result_idx == columns->size()) - { - ColumnsWithTypeAndName args{(*columns)[field.column_idx]}; - field.columns->emplace_back(ColumnWithTypeAndName {nullptr, func->getResultType(), result_name}); - (*columns)[result_idx].column = func->execute(args, (*columns)[result_idx].type, columns->front().column->size()); - } - - return {field.columns, field.row_idx, result_idx}; -} - /** When table's key has expression with these functions from a column, * and when a column in a query is compared with a constant, such as: * CREATE TABLE (x String) ORDER BY toDate(x) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 61332a4ff38..c3e348a549a 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -8,21 +8,6 @@ #include #include #include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include #include #include #include @@ -43,19 +28,20 @@ #include #include #include -#include -#include #include #include #include #include #include #include +#include +#include #include +#include #include -#include -#include #include +#include +#include #include #include #include @@ -64,26 +50,41 @@ #include #include #include -#include #include #include #include #include #include #include +#include #include #include +#include #include #include #include #include #include +#include #include #include -#include #include #include #include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include #include #include @@ -197,6 +198,50 @@ namespace ErrorCodes extern const int LIMIT_EXCEEDED; } +static size_t getPartitionAstFieldsCount(const ASTPartition & partition_ast, ASTPtr partition_value_ast) +{ + if (partition_ast.fields_count.has_value()) + return *partition_ast.fields_count; + + if (partition_value_ast->as()) + return 1; + + const auto * tuple_ast = partition_value_ast->as(); + + if (!tuple_ast) + { + throw Exception( + ErrorCodes::INVALID_PARTITION_VALUE, "Expected literal or tuple for partition key, got {}", partition_value_ast->getID()); + } + + if (tuple_ast->name != "tuple") + { + if (!isFunctionCast(tuple_ast)) + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + + if (tuple_ast->arguments->as()->children.empty()) + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + + auto first_arg = tuple_ast->arguments->as()->children.at(0); + if (const auto * inner_tuple = first_arg->as(); inner_tuple && inner_tuple->name == "tuple") + { + const auto * arguments_ast = tuple_ast->arguments->as(); + return arguments_ast ? arguments_ast->children.size() : 0; + } + else if (const auto * inner_literal_tuple = first_arg->as(); inner_literal_tuple) + { + return inner_literal_tuple->value.getType() == Field::Types::Tuple ? 
inner_literal_tuple->value.safeGet().size() : 1; + } + + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + } + else + { + const auto * arguments_ast = tuple_ast->arguments->as(); + return arguments_ast ? arguments_ast->children.size() : 0; + } +} + static void checkSuspiciousIndices(const ASTFunction * index_function) { std::unordered_set unique_index_expression_hashes; @@ -4854,7 +4899,7 @@ void MergeTreeData::removePartContributionToColumnAndSecondaryIndexSizes(const D } void MergeTreeData::checkAlterPartitionIsPossible( - const PartitionCommands & commands, const StorageMetadataPtr & /*metadata_snapshot*/, const Settings & settings, ContextPtr local_context) const + const PartitionCommands & commands, const StorageMetadataPtr & /*metadata_snapshot*/, const Settings & settings, ContextPtr) const { for (const auto & command : commands) { @@ -4882,7 +4927,15 @@ void MergeTreeData::checkAlterPartitionIsPossible( throw DB::Exception(ErrorCodes::SUPPORT_IS_DISABLED, "Only support DROP/DETACH PARTITION ALL currently"); } else - getPartitionIDFromQuery(command.partition, local_context); + { + // The below `getPartitionIDFromQuery` call will not work for attach / replace because it assumes the partition expressions + // are the same and deliberately uses this storage. Later on, `MergeTreeData::replaceFrom` is called, and it makes the right + // call to `getPartitionIDFromQuery` using source storage. + // Note: `PartitionCommand::REPLACE_PARTITION` is used both for `REPLACE PARTITION` and `ATTACH PARTITION FROM` queries. + // But not for `ATTACH PARTITION` queries. + if (command.type != PartitionCommand::REPLACE_PARTITION) + getPartitionIDFromQuery(command.partition, getContext()); + } } } } @@ -5616,69 +5669,8 @@ String MergeTreeData::getPartitionIDFromQuery(const ASTPtr & ast, ContextPtr loc MergeTreePartInfo::validatePartitionID(partition_ast.id->clone(), format_version); return partition_ast.id->as()->value.safeGet(); } - size_t partition_ast_fields_count = 0; ASTPtr partition_value_ast = partition_ast.value->clone(); - if (!partition_ast.fields_count.has_value()) - { - if (partition_value_ast->as()) - { - partition_ast_fields_count = 1; - } - else if (const auto * tuple_ast = partition_value_ast->as()) - { - if (tuple_ast->name != "tuple") - { - if (isFunctionCast(tuple_ast)) - { - if (tuple_ast->arguments->as()->children.empty()) - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - auto first_arg = tuple_ast->arguments->as()->children.at(0); - if (const auto * inner_tuple = first_arg->as(); inner_tuple && inner_tuple->name == "tuple") - { - const auto * arguments_ast = tuple_ast->arguments->as(); - if (arguments_ast) - partition_ast_fields_count = arguments_ast->children.size(); - else - partition_ast_fields_count = 0; - } - else if (const auto * inner_literal_tuple = first_arg->as(); inner_literal_tuple) - { - if (inner_literal_tuple->value.getType() == Field::Types::Tuple) - partition_ast_fields_count = inner_literal_tuple->value.safeGet().size(); - else - partition_ast_fields_count = 1; - } - else - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - } - else - throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - else - { - const auto * arguments_ast = 
tuple_ast->arguments->as(); - if (arguments_ast) - partition_ast_fields_count = arguments_ast->children.size(); - else - partition_ast_fields_count = 0; - } - } - else - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected literal or tuple for partition key, got {}", partition_value_ast->getID()); - } - } - else - { - partition_ast_fields_count = *partition_ast.fields_count; - } + auto partition_ast_fields_count = getPartitionAstFieldsCount(partition_ast, partition_value_ast); if (format_version < MERGE_TREE_DATA_MIN_FORMAT_VERSION_WITH_CUSTOM_PARTITIONING) { @@ -7014,23 +7006,35 @@ MergeTreeData & MergeTreeData::checkStructureAndGetMergeTreeData(IStorage & sour if (my_snapshot->getColumns().getAllPhysical().sizeOfDifference(src_snapshot->getColumns().getAllPhysical())) throw Exception(ErrorCodes::INCOMPATIBLE_COLUMNS, "Tables have different structure"); - auto query_to_string = [] (const ASTPtr & ast) - { - return ast ? queryToString(ast) : ""; - }; - - if (query_to_string(my_snapshot->getSortingKeyAST()) != query_to_string(src_snapshot->getSortingKeyAST())) + if (queryToStringNullable(my_snapshot->getSortingKeyAST()) != queryToStringNullable(src_snapshot->getSortingKeyAST())) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different ordering"); - if (query_to_string(my_snapshot->getPartitionKeyAST()) != query_to_string(src_snapshot->getPartitionKeyAST())) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different partition key"); - if (format_version != src_data->format_version) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different format_version"); - if (query_to_string(my_snapshot->getPrimaryKeyAST()) != query_to_string(src_snapshot->getPrimaryKeyAST())) + if (queryToStringNullable(my_snapshot->getPrimaryKeyAST()) != queryToStringNullable(src_snapshot->getPrimaryKeyAST())) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different primary key"); + const auto is_a_subset_of = [](const auto & lhs, const auto & rhs) + { + if (lhs.size() > rhs.size()) + return false; + + const auto rhs_set = NameSet(rhs.begin(), rhs.end()); + for (const auto & lhs_element : lhs) + if (!rhs_set.contains(lhs_element)) + return false; + + return true; + }; + + if (!is_a_subset_of(my_snapshot->getColumnsRequiredForPartitionKey(), src_snapshot->getColumnsRequiredForPartitionKey())) + { + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "Destination table partition expression columns must be a subset of source table partition expression columns"); + } + const auto check_definitions = [](const auto & my_descriptions, const auto & src_descriptions) { if (my_descriptions.size() != src_descriptions.size()) @@ -7071,128 +7075,56 @@ std::pair MergeTreeData::cloneAn const ReadSettings & read_settings, const WriteSettings & write_settings) { - /// Check that the storage policy contains the disk where the src_part is located. 
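The subset check above also gives the rejection case a crisp shape: if the destination's partition expression needs a column the source's does not partition by, the attach fails before any part is cloned. A counter-sketch using the test suite's error annotation (schemas illustrative):

```sql
CREATE TABLE src_by_key (ts DateTime, key Int64)
ENGINE = MergeTree PARTITION BY key ORDER BY key;

CREATE TABLE dst_by_ts (ts DateTime, key Int64)
ENGINE = MergeTree PARTITION BY toYYYYMM(ts) ORDER BY key;

-- dst partitions by ts, which src's partition expression does not use.
ALTER TABLE dst_by_ts ATTACH PARTITION 1 FROM src_by_key; -- { serverError BAD_ARGUMENTS }
```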
- bool does_storage_policy_allow_same_disk = false; - for (const DiskPtr & disk : getStoragePolicy()->getDisks()) - { - if (disk->getName() == src_part->getDataPartStorage().getDiskName()) - { - does_storage_policy_allow_same_disk = true; - break; - } - } - if (!does_storage_policy_allow_same_disk) - throw Exception( - ErrorCodes::BAD_ARGUMENTS, - "Could not clone and load part {} because disk does not belong to storage policy", - quoteString(src_part->getDataPartStorage().getFullPath())); + return MergeTreeDataPartCloner::clone( + this, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, require_part_metadata, params, read_settings, write_settings); +} - String dst_part_name = src_part->getNewName(dst_part_info); - String tmp_dst_part_name = tmp_part_prefix + dst_part_name; - auto temporary_directory_lock = getTemporaryPartDirectoryHolder(tmp_dst_part_name); +std::pair MergeTreeData::cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + const MergeTreeData::DataPartPtr & src_part, + const MergeTreePartition & new_partition, + const String & partition_id, + const IMergeTreeDataPart::MinMaxIndex & min_max_index, + const String & tmp_part_prefix, + const StorageMetadataPtr & my_metadata_snapshot, + const IDataPartStorage::ClonePartParams & clone_params, + ContextPtr local_context, + Int64 min_block, + Int64 max_block +) +{ + MergeTreePartInfo dst_part_info(partition_id, min_block, max_block, src_part->info.level); - /// Why it is needed if we only hardlink files? - auto reservation = src_part->getDataPartStorage().reserve(src_part->getBytesOnDisk()); - auto src_part_storage = src_part->getDataPartStoragePtr(); + return MergeTreeDataPartCloner::cloneWithDistinctPartitionExpression( + this, + src_part, + my_metadata_snapshot, + dst_part_info, + tmp_part_prefix, + local_context->getReadSettings(), + local_context->getWriteSettings(), + new_partition, + min_max_index, + false, + clone_params); +} - scope_guard src_flushed_tmp_dir_lock; - MergeTreeData::MutableDataPartPtr src_flushed_tmp_part; +std::pair MergeTreeData::createPartitionAndMinMaxIndexFromSourcePart( + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context) +{ + const auto & src_data = src_part->storage; - /// If source part is in memory, flush it to disk and clone it already in on-disk format - /// Protect tmp dir from removing by cleanup thread with src_flushed_tmp_dir_lock - /// Construct src_flushed_tmp_part in order to delete part with its directory at destructor - if (auto src_part_in_memory = asInMemoryPart(src_part)) - { - auto flushed_part_path = *src_part_in_memory->getRelativePathForPrefix(tmp_part_prefix); + auto metadata_manager = std::make_shared(src_part.get()); + IMergeTreeDataPart::MinMaxIndex min_max_index; - auto tmp_src_part_file_name = fs::path(tmp_dst_part_name).filename(); - src_flushed_tmp_dir_lock = src_part->storage.getTemporaryPartDirectoryHolder(tmp_src_part_file_name); + min_max_index.load(src_data, metadata_manager); - auto flushed_part_storage = src_part_in_memory->flushToDisk(flushed_part_path, metadata_snapshot); + MergeTreePartition new_partition; - src_flushed_tmp_part = MergeTreeDataPartBuilder(*this, src_part->name, flushed_part_storage) - .withPartInfo(src_part->info) - .withPartFormatFromDisk() - .build(); + new_partition.create(metadata_snapshot, min_max_index.getBlock(src_data), 0u, local_context); - src_flushed_tmp_part->is_temp = true; - src_part_storage = flushed_part_storage; - } - - String with_copy; - if 
(params.copy_instead_of_hardlink) - with_copy = " (copying data)"; - - auto dst_part_storage = src_part_storage->freeze( - relative_data_path, - tmp_dst_part_name, - read_settings, - write_settings, - /* save_metadata_callback= */ {}, - params); - - if (params.metadata_version_to_write.has_value()) - { - chassert(!params.keep_metadata_version); - auto out_metadata = dst_part_storage->writeFile(IMergeTreeDataPart::METADATA_VERSION_FILE_NAME, 4096, getContext()->getWriteSettings()); - writeText(metadata_snapshot->getMetadataVersion(), *out_metadata); - out_metadata->finalize(); - if (getSettings()->fsync_after_insert) - out_metadata->sync(); - } - - LOG_DEBUG(log, "Clone{} part {} to {}{}", - src_flushed_tmp_part ? " flushed" : "", - src_part_storage->getFullPath(), - std::string(fs::path(dst_part_storage->getFullRootPath()) / tmp_dst_part_name), - with_copy); - - auto dst_data_part = MergeTreeDataPartBuilder(*this, dst_part_name, dst_part_storage) - .withPartFormatFromDisk() - .build(); - - if (!params.copy_instead_of_hardlink && params.hardlinked_files) - { - params.hardlinked_files->source_part_name = src_part->name; - params.hardlinked_files->source_table_shared_id = src_part->storage.getTableSharedID(); - - for (auto it = src_part->getDataPartStorage().iterate(); it->isValid(); it->next()) - { - if (!params.files_to_copy_instead_of_hardlinks.contains(it->name()) - && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED - && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) - { - params.hardlinked_files->hardlinks_from_source_part.insert(it->name()); - } - } - - auto projections = src_part->getProjectionParts(); - for (const auto & [name, projection_part] : projections) - { - const auto & projection_storage = projection_part->getDataPartStorage(); - for (auto it = projection_storage.iterate(); it->isValid(); it->next()) - { - auto file_name_with_projection_prefix = fs::path(projection_storage.getPartDirectory()) / it->name(); - if (!params.files_to_copy_instead_of_hardlinks.contains(file_name_with_projection_prefix) - && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED - && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) - { - params.hardlinked_files->hardlinks_from_source_part.insert(file_name_with_projection_prefix); - } - } - } - } - - /// We should write version metadata on part creation to distinguish it from parts that were created without transaction. - TransactionID tid = params.txn ? 
params.txn->tid : Tx::PrehistoricTID; - dst_data_part->version.setCreationTID(tid, nullptr); - dst_data_part->storeVersionMetadata(); - - dst_data_part->is_temp = true; - - dst_data_part->loadColumnsChecksumsIndexes(require_part_metadata, true); - dst_data_part->modification_time = dst_part_storage->getLastModified().epochTime(); - return std::make_pair(dst_data_part, std::move(temporary_directory_lock)); + return {new_partition, min_max_index}; } String MergeTreeData::getFullPathOnDisk(const DiskPtr & disk) const diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h index f0dbaf0e307..9c433e11b84 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -231,6 +231,7 @@ public: } }; + using DataParts = std::set; using MutableDataParts = std::set; using DataPartsVector = std::vector; @@ -848,6 +849,23 @@ public: const ReadSettings & read_settings, const WriteSettings & write_settings); + std::pair cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + const MergeTreeData::DataPartPtr & src_part, + const MergeTreePartition & new_partition, + const String & partition_id, + const IMergeTreeDataPart::MinMaxIndex & min_max_index, + const String & tmp_part_prefix, + const StorageMetadataPtr & my_metadata_snapshot, + const IDataPartStorage::ClonePartParams & clone_params, + ContextPtr local_context, + Int64 min_block, + Int64 max_block); + + static std::pair createPartitionAndMinMaxIndexFromSourcePart( + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context); + virtual std::vector getMutationsStatus() const = 0; /// Returns true if table can create new parts with adaptive granularity diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp new file mode 100644 index 00000000000..78cb9aa0624 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp @@ -0,0 +1,320 @@ +#include +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ +extern const int BAD_ARGUMENTS; +} + +static Poco::Logger * log = &Poco::Logger::get("MergeTreeDataPartCloner"); + +namespace DistinctPartitionExpression +{ +std::unique_ptr updatePartitionFile( + const MergeTreeData & merge_tree_data, + const MergeTreePartition & partition, + const MergeTreeData::MutableDataPartPtr & dst_part, + IDataPartStorage & storage) +{ + storage.removeFile("partition.dat"); + // Leverage already implemented MergeTreePartition::store to create & store partition.dat. + // Checksum is re-calculated later. 
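
In SQL terms, the cloneAndLoadPartOnSameDiskWithDifferentPartitionKey entry point declared above is reached whenever the two tables' partition expressions differ; a sketch taken from the first case of the 02456 reference below:

    CREATE TABLE source (timestamp DateTime) ENGINE = MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp);
    CREATE TABLE destination (timestamp DateTime) ENGINE = MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp);
    INSERT INTO source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03');
    ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source;
    -- partition.dat and the minmax files of the cloned part are rewritten, so it lands in partition 201003:
    SELECT partition_id FROM system.parts WHERE table = 'destination' AND database = currentDatabase() AND active;
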
+ return partition.store(merge_tree_data, storage, dst_part->checksums); +} + +IMergeTreeDataPart::MinMaxIndex::WrittenFiles updateMinMaxFiles( + const MergeTreeData & merge_tree_data, + const MergeTreeData::MutableDataPartPtr & dst_part, + IDataPartStorage & storage, + const StorageMetadataPtr & metadata_snapshot) +{ + for (const auto & column_name : MergeTreeData::getMinMaxColumnsNames(metadata_snapshot->partition_key)) + { + auto file = "minmax_" + escapeForFileName(column_name) + ".idx"; + storage.removeFile(file); + } + + return dst_part->minmax_idx->store(merge_tree_data, storage, dst_part->checksums); +} + +void finalizeNewFiles(const std::vector> & files, bool sync_new_files) +{ + for (const auto & file : files) + { + file->finalize(); + if (sync_new_files) + file->sync(); + } +} + +void updateNewPartFiles( + const MergeTreeData & merge_tree_data, + const MergeTreeData::MutableDataPartPtr & dst_part, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + const StorageMetadataPtr & src_metadata_snapshot, + bool sync_new_files) +{ + auto & storage = dst_part->getDataPartStorage(); + + *dst_part->minmax_idx = new_min_max_index; + + auto partition_file = updatePartitionFile(merge_tree_data, new_partition, dst_part, storage); + + auto min_max_files = updateMinMaxFiles(merge_tree_data, dst_part, storage, src_metadata_snapshot); + + IMergeTreeDataPart::MinMaxIndex::WrittenFiles written_files; + + if (partition_file) + written_files.emplace_back(std::move(partition_file)); + + written_files.insert(written_files.end(), std::make_move_iterator(min_max_files.begin()), std::make_move_iterator(min_max_files.end())); + + finalizeNewFiles(written_files, sync_new_files); + + // MergeTreeDataPartCloner::finalize_part calls IMergeTreeDataPart::loadColumnsChecksumsIndexes, which will re-create + // the checksum file if it doesn't exist. Relying on that is cumbersome, but this refactoring is simply a code extraction + // with small improvements. It can be further improved in the future. 
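
Because checksums.txt is removed just below and regenerated by loadColumnsChecksumsIndexes during finalization, a quick SQL-level sanity check after such an attach can be useful (illustrative, assuming a destination table named destination):

    -- Re-reads the parts and verifies file sizes and checksums, including the regenerated checksums.txt:
    CHECK TABLE destination;
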
+ storage.removeFile("checksums.txt"); +} +} + +namespace +{ +bool doesStoragePolicyAllowSameDisk(MergeTreeData * merge_tree_data, const MergeTreeData::DataPartPtr & src_part) +{ + for (const DiskPtr & disk : merge_tree_data->getStoragePolicy()->getDisks()) + if (disk->getName() == src_part->getDataPartStorage().getDiskName()) + return true; + return false; +} + +DataPartStoragePtr flushPartStorageToDiskIfInMemory( + MergeTreeData * merge_tree_data, + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const String & tmp_part_prefix, + const String & tmp_dst_part_name, + scope_guard & src_flushed_tmp_dir_lock, + MergeTreeData::MutableDataPartPtr src_flushed_tmp_part) +{ + if (auto src_part_in_memory = asInMemoryPart(src_part)) + { + auto flushed_part_path = src_part_in_memory->getRelativePathForPrefix(tmp_part_prefix); + auto tmp_src_part_file_name = fs::path(tmp_dst_part_name).filename(); + + src_flushed_tmp_dir_lock = src_part->storage.getTemporaryPartDirectoryHolder(tmp_src_part_file_name); + + auto flushed_part_storage = src_part_in_memory->flushToDisk(*flushed_part_path, metadata_snapshot); + + src_flushed_tmp_part = MergeTreeDataPartBuilder(*merge_tree_data, src_part->name, flushed_part_storage) + .withPartInfo(src_part->info) + .withPartFormatFromDisk() + .build(); + + src_flushed_tmp_part->is_temp = true; + + return flushed_part_storage; + } + + return src_part->getDataPartStoragePtr(); +} + +std::shared_ptr hardlinkAllFiles( + MergeTreeData * merge_tree_data, + const DB::ReadSettings & read_settings, + const DB::WriteSettings & write_settings, + const DataPartStoragePtr & storage, + const String & path, + const DB::IDataPartStorage::ClonePartParams & params) +{ + return storage->freeze( + merge_tree_data->getRelativeDataPath(), + path, + read_settings, + write_settings, + /*save_metadata_callback=*/{}, + params); +} + +std::pair cloneSourcePart( + MergeTreeData * merge_tree_data, + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const DB::IDataPartStorage::ClonePartParams & params) +{ + const auto dst_part_name = src_part->getNewName(dst_part_info); + + const auto tmp_dst_part_name = tmp_part_prefix + dst_part_name; + + auto temporary_directory_lock = merge_tree_data->getTemporaryPartDirectoryHolder(tmp_dst_part_name); + + src_part->getDataPartStorage().reserve(src_part->getBytesOnDisk()); + + scope_guard src_flushed_tmp_dir_lock; + MergeTreeData::MutableDataPartPtr src_flushed_tmp_part; + + auto src_part_storage = flushPartStorageToDiskIfInMemory( + merge_tree_data, src_part, metadata_snapshot, tmp_part_prefix, tmp_dst_part_name, src_flushed_tmp_dir_lock, src_flushed_tmp_part); + + auto dst_part_storage = hardlinkAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name, params); + + if (params.metadata_version_to_write.has_value()) + { + chassert(!params.keep_metadata_version); + auto out_metadata = dst_part_storage->writeFile( + IMergeTreeDataPart::METADATA_VERSION_FILE_NAME, 4096, merge_tree_data->getContext()->getWriteSettings()); + writeText(metadata_snapshot->getMetadataVersion(), *out_metadata); + out_metadata->finalize(); + if (merge_tree_data->getSettings()->fsync_after_insert) + out_metadata->sync(); + } + + LOG_DEBUG( + log, + "Clone {} part {} to {}{}", + src_flushed_tmp_part ? 
"flushed" : "", + src_part_storage->getFullPath(), + std::string(fs::path(dst_part_storage->getFullRootPath()) / tmp_dst_part_name), + false); + + + auto part = MergeTreeDataPartBuilder(*merge_tree_data, dst_part_name, dst_part_storage).withPartFormatFromDisk().build(); + + return std::make_pair(part, std::move(temporary_directory_lock)); +} + +void handleHardLinkedParameterFiles(const MergeTreeData::DataPartPtr & src_part, const DB::IDataPartStorage::ClonePartParams & params) +{ + const auto & hardlinked_files = params.hardlinked_files; + + hardlinked_files->source_part_name = src_part->name; + hardlinked_files->source_table_shared_id = src_part->storage.getTableSharedID(); + + for (auto it = src_part->getDataPartStorage().iterate(); it->isValid(); it->next()) + { + if (!params.files_to_copy_instead_of_hardlinks.contains(it->name()) + && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED + && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) + { + hardlinked_files->hardlinks_from_source_part.insert(it->name()); + } + } +} + +void handleProjections(const MergeTreeData::DataPartPtr & src_part, const DB::IDataPartStorage::ClonePartParams & params) +{ + auto projections = src_part->getProjectionParts(); + for (const auto & [name, projection_part] : projections) + { + const auto & projection_storage = projection_part->getDataPartStorage(); + for (auto it = projection_storage.iterate(); it->isValid(); it->next()) + { + auto file_name_with_projection_prefix = fs::path(projection_storage.getPartDirectory()) / it->name(); + if (!params.files_to_copy_instead_of_hardlinks.contains(file_name_with_projection_prefix) + && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED + && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) + { + params.hardlinked_files->hardlinks_from_source_part.insert(file_name_with_projection_prefix); + } + } + } +} + +MergeTreeData::MutableDataPartPtr finalizePart( + const MergeTreeData::MutableDataPartPtr & dst_part, const DB::IDataPartStorage::ClonePartParams & params, bool require_part_metadata) +{ + /// We should write version metadata on part creation to distinguish it from parts that were created without transaction. + TransactionID tid = params.txn ? 
params.txn->tid : Tx::PrehistoricTID; + dst_part->version.setCreationTID(tid, nullptr); + dst_part->storeVersionMetadata(); + + dst_part->is_temp = true; + + dst_part->loadColumnsChecksumsIndexes(require_part_metadata, true); + + dst_part->modification_time = dst_part->getDataPartStorage().getLastModified().epochTime(); + + return dst_part; +} + +std::pair cloneAndHandleHardlinksAndProjections( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const IDataPartStorage::ClonePartParams & params) +{ + if (!doesStoragePolicyAllowSameDisk(merge_tree_data, src_part)) + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "Could not clone and load part {} because disk does not belong to storage policy", + quoteString(src_part->getDataPartStorage().getFullPath())); + + auto [destination_part, temporary_directory_lock] = cloneSourcePart( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + if (!params.copy_instead_of_hardlink && params.hardlinked_files) + { + handleHardLinkedParameterFiles(src_part, params); + handleProjections(src_part, params); + } + + return std::make_pair(destination_part, std::move(temporary_directory_lock)); +} +} + +std::pair MergeTreeDataPartCloner::clone( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + bool require_part_metadata, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings) +{ + auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + return std::make_pair(finalizePart(destination_part, params, require_part_metadata), std::move(temporary_directory_lock)); +} + +std::pair MergeTreeDataPartCloner::cloneWithDistinctPartitionExpression( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + bool sync_new_files, + const IDataPartStorage::ClonePartParams & params) +{ + auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + DistinctPartitionExpression::updateNewPartFiles( + *merge_tree_data, destination_part, new_partition, new_min_max_index, src_part->storage.getInMemoryMetadataPtr(), sync_new_files); + + return std::make_pair(finalizePart(destination_part, params, false), std::move(temporary_directory_lock)); +} + +} diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.h b/src/Storages/MergeTree/MergeTreeDataPartCloner.h new file mode 100644 index 00000000000..53585f20b7f --- /dev/null +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.h @@ -0,0 +1,43 @@ +#pragma once + +namespace DB +{ + +struct StorageInMemoryMetadata; +using 
StorageMetadataPtr = std::shared_ptr; +struct MergeTreePartition; +class IMergeTreeDataPart; + +class MergeTreeDataPartCloner +{ +public: + using DataPart = IMergeTreeDataPart; + using MutableDataPartPtr = std::shared_ptr; + using DataPartPtr = std::shared_ptr; + + static std::pair clone( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + bool require_part_metadata, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings); + + static std::pair cloneWithDistinctPartitionExpression( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + bool sync_new_files, + const IDataPartStorage::ClonePartParams & params); +}; + +} diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index ddeaf69136a..76ef3be25b3 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -467,6 +467,45 @@ void MergeTreePartition::create(const StorageMetadataPtr & metadata_snapshot, Bl } } +void MergeTreePartition::createAndValidateMinMaxPartitionIds( + const StorageMetadataPtr & metadata_snapshot, Block block_with_min_max_partition_ids, ContextPtr context) +{ + if (!metadata_snapshot->hasPartitionKey()) + return; + + auto partition_key_names_and_types = executePartitionByExpression(metadata_snapshot, block_with_min_max_partition_ids, context); + value.resize(partition_key_names_and_types.size()); + + /// Executing partition_by expression adds new columns to passed block according to partition functions. + /// The block is passed by reference and is used afterwards. `moduloLegacy` needs to be substituted back + /// with just `modulo`, because it was a temporary substitution. + static constexpr std::string_view modulo_legacy_function_name = "moduloLegacy"; + + size_t i = 0; + for (const auto & element : partition_key_names_and_types) + { + auto & partition_column = block_with_min_max_partition_ids.getByName(element.name); + + if (element.name.starts_with(modulo_legacy_function_name)) + partition_column.name.replace(0, modulo_legacy_function_name.size(), "modulo"); + + Field extracted_min_partition_id_field; + Field extracted_max_partition_id_field; + + partition_column.column->get(0, extracted_min_partition_id_field); + partition_column.column->get(1, extracted_max_partition_id_field); + + if (extracted_min_partition_id_field != extracted_max_partition_id_field) + { + throw Exception( + ErrorCodes::INVALID_PARTITION_VALUE, + "Can not create the partition. 
A partition can not contain values that have different partition ids"); + } + + partition_column.column->get(0u, value[i++]); + } +} + NamesAndTypesList MergeTreePartition::executePartitionByExpression(const StorageMetadataPtr & metadata_snapshot, Block & block, ContextPtr context) { auto adjusted_partition_key = adjustPartitionKey(metadata_snapshot, context); diff --git a/src/Storages/MergeTree/MergeTreePartition.h b/src/Storages/MergeTree/MergeTreePartition.h index 78b141f26ec..fd7ae02cde4 100644 --- a/src/Storages/MergeTree/MergeTreePartition.h +++ b/src/Storages/MergeTree/MergeTreePartition.h @@ -1,11 +1,12 @@ #pragma once -#include +#include #include #include #include #include -#include +#include +#include namespace DB { @@ -51,6 +52,11 @@ public: void create(const StorageMetadataPtr & metadata_snapshot, Block block, size_t row, ContextPtr context); + /// Copy of MergeTreePartition::create, but also validates if min max partition keys are equal. If they are different, + /// it means the partition can't be created because the data doesn't belong to the same partition. + void createAndValidateMinMaxPartitionIds( + const StorageMetadataPtr & metadata_snapshot, Block block_with_min_max_partition_ids, ContextPtr context); + static void appendFiles(const MergeTreeData & storage, Strings & files); /// Adjust partition key and execute its expression on block. Return sample block according to used expression. diff --git a/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp new file mode 100644 index 00000000000..21bcdb84a96 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp @@ -0,0 +1,91 @@ +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ +extern const int BAD_ARGUMENTS; +} + +namespace +{ +bool isDestinationPartitionExpressionMonotonicallyIncreasing( + const std::vector & hyperrectangle, const MergeTreeData & destination_storage) +{ + auto destination_table_metadata = destination_storage.getInMemoryMetadataPtr(); + + auto key_description = destination_table_metadata->getPartitionKey(); + auto definition_ast = key_description.definition_ast->clone(); + + auto table_identifier = std::make_shared(destination_storage.getStorageID().getTableName()); + auto table_with_columns + = TableWithColumnNamesAndTypes{DatabaseAndTableWithAlias(table_identifier), destination_table_metadata->getColumns().getOrdinary()}; + + auto expression_list = extractKeyExpressionList(definition_ast); + + MonotonicityCheckVisitor::Data data{{table_with_columns}, destination_storage.getContext(), /*group_by_function_hashes*/ {}}; + + for (auto i = 0u; i < expression_list->children.size(); i++) + { + data.range = hyperrectangle[i]; + + MonotonicityCheckVisitor(data).visit(expression_list->children[i]); + + if (!data.monotonicity.is_monotonic || !data.monotonicity.is_positive) + return false; + } + + return true; +} + +bool isExpressionDirectSubsetOf(const ASTPtr source, const ASTPtr destination) +{ + auto source_expression_list = extractKeyExpressionList(source); + auto destination_expression_list = extractKeyExpressionList(destination); + + std::unordered_set source_columns; + + for (auto i = 0u; i < source_expression_list->children.size(); ++i) + source_columns.insert(source_expression_list->children[i]->getColumnName()); + + for (auto i = 0u; i < destination_expression_list->children.size(); ++i) + if 
(!source_columns.contains(destination_expression_list->children[i]->getColumnName()))
+            return false;
+
+    return true;
+}
+}
+
+void MergeTreePartitionCompatibilityVerifier::verify(
+    const MergeTreeData & source_storage, const MergeTreeData & destination_storage, const DataPartsVector & source_parts)
+{
+    const auto source_metadata = source_storage.getInMemoryMetadataPtr();
+    const auto destination_metadata = destination_storage.getInMemoryMetadataPtr();
+
+    const auto source_partition_key_ast = source_metadata->getPartitionKeyAST();
+    const auto destination_partition_key_ast = destination_metadata->getPartitionKeyAST();
+
+    // If destination partition expression columns are a subset of source partition expression columns,
+    // there is no need to check for monotonicity.
+    if (isExpressionDirectSubsetOf(source_partition_key_ast, destination_partition_key_ast))
+        return;
+
+    const auto src_global_min_max_indexes = MergeTreePartitionGlobalMinMaxIdxCalculator::calculate(source_parts, destination_storage);
+
+    assert(!src_global_min_max_indexes.hyperrectangle.empty());
+
+    if (!isDestinationPartitionExpressionMonotonicallyIncreasing(src_global_min_max_indexes.hyperrectangle, destination_storage))
+        throw DB::Exception(ErrorCodes::BAD_ARGUMENTS, "Destination table partition expression is not monotonically increasing");
+
+    MergeTreePartition().createAndValidateMinMaxPartitionIds(
+        destination_storage.getInMemoryMetadataPtr(),
+        src_global_min_max_indexes.getBlock(destination_storage),
+        destination_storage.getContext());
+}
+
+}
diff --git a/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h
new file mode 100644
index 00000000000..1682add3ebd
--- /dev/null
+++ b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h
@@ -0,0 +1,30 @@
+#pragma once
+
+#include <Storages/MergeTree/IMergeTreeDataPart.h>
+#include <Storages/MergeTree/MergeTreeData.h>
+
+namespace DB
+{
+
+/*
+ * Verifies that source and destination partitions are compatible.
+ * To be compatible, one of the following criteria must be met:
+ * 1. Destination partition expression columns are a subset of source partition expression columns; or
+ * 2. Destination partition expression is monotonic on the source global min_max idx range AND the computed partition id for
+ *    the source global min_max idx range is the same.
+ *
+ * If not, an exception is thrown.
+ * */ + +class MergeTreePartitionCompatibilityVerifier +{ +public: + using DataPart = IMergeTreeDataPart; + using DataPartPtr = std::shared_ptr; + using DataPartsVector = std::vector; + + static void + verify(const MergeTreeData & source_storage, const MergeTreeData & destination_storage, const DataPartsVector & source_parts); +}; + +} diff --git a/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp new file mode 100644 index 00000000000..0871efadf0c --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp @@ -0,0 +1,25 @@ +#include + +namespace DB +{ + +IMergeTreeDataPart::MinMaxIndex +MergeTreePartitionGlobalMinMaxIdxCalculator::calculate(const DataPartsVector & parts, const MergeTreeData & storage) +{ + IMergeTreeDataPart::MinMaxIndex global_min_max_indexes; + + for (const auto & part : parts) + { + auto metadata_manager = std::make_shared(part.get()); + + auto local_min_max_index = MergeTreeData::DataPart::MinMaxIndex(); + + local_min_max_index.load(storage, metadata_manager); + + global_min_max_indexes.merge(local_min_max_index); + } + + return global_min_max_indexes; +} + +} diff --git a/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h new file mode 100644 index 00000000000..4f271177246 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h @@ -0,0 +1,24 @@ +#pragma once + +#include + +#include +#include + +namespace DB +{ + +/* + * Calculates global min max indexes for a given set of parts on given storage. + * */ +class MergeTreePartitionGlobalMinMaxIdxCalculator +{ + using DataPart = IMergeTreeDataPart; + using DataPartPtr = std::shared_ptr; + using DataPartsVector = std::vector; + +public: + static IMergeTreeDataPart::MinMaxIndex calculate(const DataPartsVector & parts, const MergeTreeData & storage); +}; + +} diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 4761ccd8b58..fd5354a00a9 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -5,9 +5,9 @@ #include #include -#include #include #include +#include #include "Common/Exception.h" #include #include @@ -20,25 +20,30 @@ #include #include #include +#include #include -#include #include #include #include #include #include -#include #include +#include +#include #include #include #include -#include -#include -#include -#include -#include #include +#include +#include +#include +#include +#include +#include #include +#include +#include +#include #include #include #include @@ -2039,41 +2044,73 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con ProfileEventsScope profile_events_scope; MergeTreeData & src_data = checkStructureAndGetMergeTreeData(source_table, source_metadata_snapshot, my_metadata_snapshot); - String partition_id = getPartitionIDFromQuery(partition, local_context); + String partition_id = src_data.getPartitionIDFromQuery(partition, local_context); DataPartsVector src_parts = src_data.getVisibleDataPartsVectorInPartition(local_context, partition_id); + + bool attach_empty_partition = !replace && src_parts.empty(); + if (attach_empty_partition) + return; + MutableDataPartsVector dst_parts; std::vector dst_parts_locks; static const String TMP_PREFIX = "tmp_replace_from_"; - for (const DataPartPtr & src_part : src_parts) + const auto my_partition_expression = 
my_metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_metadata_snapshot->getPartitionKeyAST(); + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different && !src_parts.empty()) + MergeTreePartitionCompatibilityVerifier::verify(src_data, /* destination_storage */ *this, src_parts); + + for (DataPartPtr & src_part : src_parts) { if (!canReplacePartition(src_part)) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot replace partition '{}' because part '{}' has inconsistent granularity with table", partition_id, src_part->name); - /// This will generate unique name in scope of current server process. - Int64 temp_index = insert_increment.get(); - MergeTreePartInfo dst_part_info(partition_id, temp_index, temp_index, src_part->info.level); - IDataPartStorage::ClonePartParams clone_params{.txn = local_context->getCurrentTransaction()}; - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - my_metadata_snapshot, - clone_params, - local_context->getReadSettings(), - local_context->getWriteSettings()); - dst_parts.emplace_back(std::move(dst_part)); - dst_parts_locks.emplace_back(std::move(part_lock)); - } + /// This will generate unique name in scope of current server process. + auto index = insert_increment.get(); - /// ATTACH empty part set - if (!replace && dst_parts.empty()) - return; + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart( + src_part, my_metadata_snapshot, local_context); + + auto [dst_part, part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + src_part, + new_partition, + new_partition.getID(*this), + new_min_max_index, + TMP_PREFIX, + my_metadata_snapshot, + clone_params, + local_context, + index, + index); + + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); + + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + my_metadata_snapshot, + clone_params, + local_context->getReadSettings(), + local_context->getWriteSettings()); + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + } MergeTreePartInfo drop_range; if (replace) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index f7e6783dbc2..512811e39d7 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -26,22 +26,21 @@ #include -#include #include #include #include #include #include -#include #include #include -#include #include #include #include #include #include +#include #include +#include #include #include #include @@ -53,9 +52,11 @@ #include #include #include +#include #include #include #include +#include #include #include @@ -2713,16 +2714,48 @@ bool StorageReplicatedMergeTree::executeReplaceRange(LogEntry & entry) .copy_instead_of_hardlink = storage_settings_ptr->always_use_copy_instead_of_hardlinks || ((our_zero_copy_enabled || source_zero_copy_enabled) && part_desc->src_table_part->isStoredOnRemoteDiskWithZeroCopySupport()), .metadata_version_to_write = metadata_snapshot->getMetadataVersion() }; - auto [res_part, temporary_part_lock] = cloneAndLoadDataPartOnSameDisk( - 
part_desc->src_table_part, - TMP_PREFIX + "clone_", - part_desc->new_part_info, - metadata_snapshot, - clone_params, - getContext()->getReadSettings(), - getContext()->getWriteSettings()); - part_desc->res_part = std::move(res_part); - part_desc->temporary_part_lock = std::move(temporary_part_lock); + + const auto my_partition_expression = metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_table->getInMemoryMetadataPtr()->getPartitionKeyAST(); + + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart( + part_desc->src_table_part, metadata_snapshot, getContext()); + + auto partition_id = new_partition.getID(*this); + + auto [res_part, temporary_part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + part_desc->src_table_part, + new_partition, + partition_id, + new_min_max_index, + TMP_PREFIX + "clone_", + metadata_snapshot, + clone_params, + getContext(), + part_desc->new_part_info.min_block, + part_desc->new_part_info.max_block); + + part_desc->res_part = std::move(res_part); + part_desc->temporary_part_lock = std::move(temporary_part_lock); + } + else + { + auto [res_part, temporary_part_lock] = cloneAndLoadDataPartOnSameDisk( + part_desc->src_table_part, + TMP_PREFIX + "clone_", + part_desc->new_part_info, + metadata_snapshot, + clone_params, + getContext()->getReadSettings(), + getContext()->getWriteSettings()); + + part_desc->res_part = std::move(res_part); + part_desc->temporary_part_lock = std::move(temporary_part_lock); + } } else if (!part_desc->replica.empty()) { @@ -7852,11 +7885,22 @@ void StorageReplicatedMergeTree::replacePartitionFrom( ProfileEventsScope profile_events_scope; MergeTreeData & src_data = checkStructureAndGetMergeTreeData(source_table, source_metadata_snapshot, metadata_snapshot); - String partition_id = getPartitionIDFromQuery(partition, query_context); + String partition_id = src_data.getPartitionIDFromQuery(partition, query_context); /// NOTE: Some covered parts may be missing in src_all_parts if corresponding log entries are not executed yet. 
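
The compatibility check invoked below rejects attaches whose data cannot stay in a single destination partition: a non-monotonic destination expression fails with BAD_ARGUMENTS, and split partition ids fail inside createAndValidateMinMaxPartitionIds. A sketch of the latter, assuming the INVALID_PARTITION_VALUE error shown earlier:

    CREATE TABLE source (timestamp DateTime, A Int64) ENGINE = MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6);
    CREATE TABLE destination (timestamp DateTime, A Int64) ENGINE = MergeTree ORDER BY timestamp PARTITION BY A;
    -- A = 1 and A = 2 share source partition 0 but map to different destination partitions:
    INSERT INTO source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 2);
    ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; -- { serverError INVALID_PARTITION_VALUE }
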
DataPartsVector src_all_parts = src_data.getVisibleDataPartsVectorInPartition(query_context, partition_id); + bool attach_empty_partition = !replace && src_all_parts.empty(); + if (attach_empty_partition) + return; + + const auto my_partition_expression = metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_metadata_snapshot->getPartitionKeyAST(); + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different && !src_all_parts.empty()) + MergeTreePartitionCompatibilityVerifier::verify(src_data, /* destination_storage */ *this, src_all_parts); + LOG_DEBUG(log, "Cloning {} parts", src_all_parts.size()); static const String TMP_PREFIX = "tmp_replace_from_"; @@ -7911,6 +7955,18 @@ void StorageReplicatedMergeTree::replacePartitionFrom( "Cannot replace partition '{}' because part '{}" "' has inconsistent granularity with table", partition_id, src_part->name); + IMergeTreeDataPart::MinMaxIndex min_max_index = *src_part->minmax_idx; + MergeTreePartition merge_tree_partition = src_part->partition; + + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart(src_part, metadata_snapshot, query_context); + + merge_tree_partition = new_partition; + min_max_index = new_min_max_index; + partition_id = merge_tree_partition.getID(*this); + } + String hash_hex = src_part->checksums.getTotalChecksumHex(); const bool is_duplicated_part = replaced_parts.contains(hash_hex); replaced_parts.insert(hash_hex); @@ -7929,27 +7985,52 @@ void StorageReplicatedMergeTree::replacePartitionFrom( continue; } - UInt64 index = lock->getNumber(); - MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); - bool zero_copy_enabled = storage_settings_ptr->allow_remote_fs_zero_copy_replication || dynamic_cast(source_table.get())->getSettings()->allow_remote_fs_zero_copy_replication; + + UInt64 index = lock->getNumber(); + IDataPartStorage::ClonePartParams clone_params { .copy_instead_of_hardlink = storage_settings_ptr->always_use_copy_instead_of_hardlinks || (zero_copy_enabled && src_part->isStoredOnRemoteDiskWithZeroCopySupport()), .metadata_version_to_write = metadata_snapshot->getMetadataVersion() }; - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - metadata_snapshot, - clone_params, - query_context->getReadSettings(), - query_context->getWriteSettings()); + + if (is_partition_exp_different) + { + auto [dst_part, part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + src_part, + merge_tree_partition, + partition_id, + min_max_index, + TMP_PREFIX, + metadata_snapshot, + clone_params, + query_context, + index, + index); + + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); + + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + metadata_snapshot, + clone_params, + query_context->getReadSettings(), + query_context->getWriteSettings()); + + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + src_parts.emplace_back(src_part); - dst_parts.emplace_back(dst_part); - dst_parts_locks.emplace_back(std::move(part_lock)); ephemeral_locks.emplace_back(std::move(*lock)); 
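
The replicated flow above is exercised end-to-end by the integration test added below; in SQL terms, assuming the same DDL is run on every replica:

    CREATE TABLE source (timestamp DateTime)
    ENGINE = ReplicatedMergeTree('/clickhouse/tables/1/source', 'replica1')
    ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp);

    CREATE TABLE destination (timestamp DateTime)
    ENGINE = ReplicatedMergeTree('/clickhouse/tables/1/destination', 'replica1')
    ORDER BY tuple() PARTITION BY toYYYYMM(timestamp);

    INSERT INTO source VALUES ('2010-03-02 02:01:01');
    ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source;
    -- Other replicas replay the REPLACE_RANGE log entry; executeReplaceRange recomputes the
    -- partition and min-max index because the partition expressions differ.
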
block_id_paths.emplace_back(block_id_path); part_checksums.emplace_back(hash_hex); diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py b/tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml b/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml new file mode 100644 index 00000000000..b40730e9f7d --- /dev/null +++ b/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml @@ -0,0 +1,17 @@ + + + + + true + + replica1 + 9000 + + + replica2 + 9000 + + + + + diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/test.py b/tests/integration/test_attach_partition_distinct_expression_replicated/test.py new file mode 100644 index 00000000000..1d8ac4e9e37 --- /dev/null +++ b/tests/integration/test_attach_partition_distinct_expression_replicated/test.py @@ -0,0 +1,214 @@ +import pytest +from helpers.cluster import ClickHouseCluster +from helpers.test_tools import assert_eq_with_retry + +cluster = ClickHouseCluster(__file__) + +replica1 = cluster.add_instance( + "replica1", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) +replica2 = cluster.add_instance( + "replica2", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) + + +@pytest.fixture(scope="module") +def start_cluster(): + try: + cluster.start() + yield cluster + except Exception as ex: + print(ex) + finally: + cluster.shutdown() + + +def cleanup(nodes): + for node in nodes: + node.query("DROP TABLE IF EXISTS source SYNC") + node.query("DROP TABLE IF EXISTS destination SYNC") + + +def create_table(node, table_name, replicated): + replica = node.name + engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/{table_name}', '{replica}')" + if replicated + else "MergeTree()" + ) + partition_expression = ( + "toYYYYMMDD(timestamp)" if table_name == "source" else "toYYYYMM(timestamp)" + ) + node.query_with_retry( + """ + CREATE TABLE {table_name}(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY {partition_expression} + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + table_name=table_name, + engine=engine, + partition_expression=partition_expression, + ) + ) + + +def test_both_replicated(start_cluster): + for node in [replica1, replica2]: + create_table(node, "source", True) + create_table(node, "destination", True) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT * FROM destination", "2010-03-02 02:01:01\n" + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination", + replica2.query(f"SELECT * FROM destination"), + ) + + cleanup([replica1, replica2]) + + +def test_only_destination_replicated(start_cluster): + create_table(replica1, "source", False) + create_table(replica1, "destination", True) + create_table(replica2, "destination", True) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH 
PARTITION ID '20100302' FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT * FROM destination", "2010-03-02 02:01:01\n" + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination", + replica2.query(f"SELECT * FROM destination"), + ) + + cleanup([replica1, replica2]) + + +def test_both_replicated_partitioned_to_unpartitioned(start_cluster): + def create_tables(nodes): + for node in nodes: + source_engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/source', '{node.name}')" + ) + node.query( + """ + CREATE TABLE source(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp) + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=source_engine, + ) + ) + + destination_engine = f"ReplicatedMergeTree('/clickhouse/tables/1/destination', '{node.name}')" + node.query( + """ + CREATE TABLE destination(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY tuple() + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=destination_engine, + ) + ) + + create_tables([replica1, replica2]) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("INSERT INTO source VALUES ('2010-03-03 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source" + ) + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100303' FROM source" + ) + + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY timestamp", + "2010-03-02 02:01:01\n2010-03-03 02:01:01\n", + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY timestamp", + replica2.query(f"SELECT * FROM destination ORDER BY timestamp"), + ) + + cleanup([replica1, replica2]) + + +def test_both_replicated_different_exp_same_id(start_cluster): + def create_tables(nodes): + for node in nodes: + source_engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/source', '{node.name}')" + ) + node.query( + """ + CREATE TABLE source(a UInt16,b UInt16,c UInt16,extra UInt64,Path String,Time DateTime,Value Float64,Timestamp Int64,sign Int8) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY a % 3 + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=source_engine, + ) + ) + + destination_engine = f"ReplicatedMergeTree('/clickhouse/tables/1/destination', '{node.name}')" + node.query( + """ + CREATE TABLE destination(a UInt16,b UInt16,c UInt16,extra UInt64,Path String,Time DateTime,Value Float64,Timestamp Int64,sign Int8) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY a + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=destination_engine, + ) + ) + + create_tables([replica1, replica2]) + + replica1.query( + "INSERT INTO source (a, b, c, extra, sign) VALUES (1, 5, 9, 1000, 1)" + ) + replica1.query( + "INSERT INTO source (a, b, c, extra, sign) VALUES (2, 6, 10, 1000, 1)" + ) + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + + replica1.query(f"ALTER TABLE destination ATTACH PARTITION 1 FROM source") + replica1.query(f"ALTER TABLE destination ATTACH PARTITION 2 FROM source") + + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY a", + 
"1\t5\t9\t1000\t\t1970-01-01 00:00:00\t0\t0\t1\n2\t6\t10\t1000\t\t1970-01-01 00:00:00\t0\t0\t1\n", + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY a", + replica2.query(f"SELECT * FROM destination ORDER BY a"), + ) + + cleanup([replica1, replica2]) diff --git a/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference new file mode 100644 index 00000000000..f1d036b08bf --- /dev/null +++ b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference @@ -0,0 +1,467 @@ +-- { echoOn } +-- Should be allowed since destination partition expr is monotonically increasing and compatible +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should be allowed since destination partition expr is monotonically increasing and compatible. Note that even though +-- the destination partition expression is more granular, the data would still fall in the same partition. 
Thus, it is valid +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +20100302 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +20100302 +-- Should be allowed since destination partition expr is monotonically increasing and compatible for those specific values +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 1); +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION 0 FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +-- Should be allowed because dst partition exp is monot inc and data is not split +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '17908065610379824077' from source; +SELECT * FROM source ORDER BY productName; +mop general +rice food +spaghetti food +SELECT * FROM destination ORDER BY productName; +rice food +spaghetti food +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +59532f3c39a412a413f0f014c7750a9d +59532f3c39a412a413f0f014c7750a9d +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '17908065610379824077' from source; +SELECT * FROM source ORDER BY productName; +mop general +rice food +spaghetti food +SELECT * FROM 
destination ORDER BY productName; +rice food +spaghetti food +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +59532f3c39a412a413f0f014c7750a9d +59532f3c39a412a413f0f014c7750a9d +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747574133 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY intDiv(timestamp, 86400000); +CREATE TABLE destination (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY toYear(toDateTime(intDiv(timestamp, 1000))); +INSERT INTO TABLE source VALUES (1267495261123); +ALTER TABLE destination ATTACH PARTITION ID '14670' FROM source; +SELECT * FROM source ORDER BY timestamp; +1267495261123 +SELECT * FROM destination ORDER BY timestamp; +1267495261123 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +2010 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '14670' from source; +SELECT * FROM source ORDER BY timestamp; +1267495261123 +SELECT * FROM destination ORDER BY timestamp; +1267495261123 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +2010 +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747511726 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY toYear(timestamp); +CREATE TABLE destination (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY (intDiv(toUInt32(timestamp),86400)); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01',1,1),('2010-03-02 02:01:01',1,1),('2011-02-02 02:01:03',1,1); +ALTER TABLE destination ATTACH PARTITION ID '2010' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +2011-02-02 02:01:03 1 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +14670 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '2010' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +2011-02-02 02:01:03 1 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +14670 +-- Should be allowed, partitioned table to unpartitioned. Since the destination is unpartitioned, parts would ultimately +-- fall into the same partition. +-- Destination partition by expression is omitted, which causes StorageMetadata::getPartitionKeyAST() to be nullptr. 
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +-- Same as above, but destination partition by expression is explicitly defined. Test case required to validate that +-- partition by tuple() is accepted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b); +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1-2 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1-2 +-- Should be allowed because the destination 
partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY a; +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +-- Should be allowed. Special test case, tricky to explain. First column of source partition expression is +-- timestamp, while first column of destination partition expression is `A`. One of the previous implementations +-- would not match the columns, which could lead to `timestamp` min max being used to calculate monotonicity of `A`. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY tuple(toYYYYMM(timestamp), intDiv(A, 6)) ORDER BY timestamp; +CREATE TABLE destination (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY A ORDER BY timestamp; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 5); +ALTER TABLE destination ATTACH PARTITION ID '201003-0' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +5 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (201003, 0) from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +5 +-- Should be allowed. Destination partition expression contains multiple expressions, but all of them are monotonically +-- increasing in the source partition min max indexes. 
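(Editor's aside, illustrative only, not part of the patch: for the tuple test below, the expected mapping can be verified by hand. The source part for partition (6, 12) has min = max = 6 for `A` and min = max = 12 for `B`, so each destination expression element is evaluated over a constant range and remains monotonic.)

SELECT intDiv(6, 2) AS a, intDiv(12, 2) AS b; -- 3, 6: the part lands in destination partition '3-6'
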
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +INSERT INTO TABLE source VALUES (6, 12); +ALTER TABLE destination ATTACH PARTITION ID '6-12' FROM source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +3-6 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (6, 12) from source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +3-6 +-- Should be allowed. The same scenario as above, but partition expressions inverted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +INSERT INTO TABLE source VALUES (6, 12); +ALTER TABLE destination ATTACH PARTITION ID '3-6' FROM source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +6-12 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (3, 6) from source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +6-12 +-- Should be allowed, it is a local operation, no different than regular attach. Replicated to replicated. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE + source(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/source_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMMDD(timestamp) + ORDER BY tuple(); +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should be allowed, it is a local operation, no different than regular attach. 
Non replicated to replicated +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source(timestamp DateTime) ENGINE = MergeTree() PARTITION BY toYYYYMMDD(timestamp) ORDER BY tuple(); +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_non_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-03 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION '201003' from source; -- { serverError 248 } +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 2); +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION 0 FROM source; -- { serverError 248 } +-- Should not be allowed because dst partition exp takes more than two arguments, so it's not considered monotonically inc +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY substring(category, 1, 2); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } +-- Should not be allowed because dst partition exp depends on a different set of columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category 
String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(productName); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } +-- Should not be allowed because dst partition exp is not monotonically increasing +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY left(productName, 2); +CREATE TABLE destination (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(productName); +INSERT INTO TABLE source VALUES ('bread'), ('mop'); +INSERT INTO TABLE source VALUES ('broccoli'); +ALTER TABLE destination ATTACH PARTITION ID '4589453b7ee96ce9de1265bd57674496' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'br' from source; -- { serverError 36 } +-- Empty/ non-existent partition, same partition expression. Nothing should happen +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Empty/ non-existent partition, different partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Replace instead of attach. Empty/ non-existent partition, same partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination REPLACE PARTITION '1' FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Replace instead of attach. Empty/ non-existent partition to non-empty partition, same partition id. 
+-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +CREATE TABLE destination (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +INSERT INTO TABLE destination VALUES (1); +ALTER TABLE destination REPLACE PARTITION '1' FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; diff --git a/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql new file mode 100644 index 00000000000..9547d6ae249 --- /dev/null +++ b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql @@ -0,0 +1,485 @@ +-- { echoOn } +-- Should be allowed since destination partition expr is monotonically increasing and compatible +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed since destination partition expr is monotonically increasing and compatible. Note that even though +-- the destination partition expression is more granular, the data would still fall in the same partition. 
Thus, it is valid +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed since destination partition expr is monotonically increasing and compatible for those specific values +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); + +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 1); + +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION 0 FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because dst partition exp is monot inc and data is not split +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '17908065610379824077' from source; + +SELECT * FROM source ORDER BY productName; +SELECT * FROM destination ORDER BY productName; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '17908065610379824077' from source; + +SELECT * FROM source ORDER BY productName; +SELECT * FROM destination ORDER BY productName; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747574133 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY intDiv(timestamp, 86400000); +CREATE TABLE destination (timestamp 
Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY toYear(toDateTime(intDiv(timestamp, 1000))); + +INSERT INTO TABLE source VALUES (1267495261123); + +ALTER TABLE destination ATTACH PARTITION ID '14670' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '14670' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747511726 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY toYear(timestamp); +CREATE TABLE destination (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY (intDiv(toUInt32(timestamp),86400)); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01',1,1),('2010-03-02 02:01:01',1,1),('2011-02-02 02:01:03',1,1); + +ALTER TABLE destination ATTACH PARTITION ID '2010' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '2010' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, partitioned table to unpartitioned. Since the destination is unpartitioned, parts would ultimately +-- fall into the same partition. +-- Destination partition by expression is omitted, which causes StorageMetadata::getPartitionKeyAST() to be nullptr. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Same as above, but destination partition by expression is explicitly defined. Test case required to validate that +-- partition by tuple() is accepted. 
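(Editor's aside, illustrative only, not part of the patch: PARTITION BY tuple() is the explicit spelling of an unpartitioned table, so the attached part gets partition id 'all', exactly as when the partition key is omitted. The table name `tuple_probe` is hypothetical.)

CREATE TABLE tuple_probe (x Int) ENGINE = MergeTree ORDER BY tuple() PARTITION BY tuple();
INSERT INTO tuple_probe VALUES (1);
SELECT DISTINCT _partition_id FROM tuple_probe; -- expected: all
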
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b); + +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); + +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY a; + +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); + +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. Special test case, tricky to explain. First column of source partition expression is +-- timestamp, while first column of destination partition expression is `A`. One of the previous implementations +-- would not match the columns, which could lead to `timestamp` min max being used to calculate monotonicity of `A`. 
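(Editor's aside, illustrative only, not part of the patch: in the test below, the source partition id is built from both expression elements, toYYYYMM(timestamp) and intDiv(A, 6), while the destination key depends on `A` alone. Matching the expression elements by column rather than by position is exactly what this case protects; a quick hand check of the id:)

SELECT toYYYYMM(toDate('2010-03-02')) AS ym, intDiv(5, 6) AS d; -- 201003, 0: source partition id '201003-0'
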
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY tuple(toYYYYMM(timestamp), intDiv(A, 6)) ORDER BY timestamp; +CREATE TABLE destination (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY A ORDER BY timestamp; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 5); + +ALTER TABLE destination ATTACH PARTITION ID '201003-0' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (201003, 0) from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. Destination partition expression contains multiple expressions, but all of them are monotonically +-- increasing in the source partition min max indexes. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); + +INSERT INTO TABLE source VALUES (6, 12); + +ALTER TABLE destination ATTACH PARTITION ID '6-12' FROM source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (6, 12) from source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. The same scenario as above, but partition expressions inverted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); + +INSERT INTO TABLE source VALUES (6, 12); + +ALTER TABLE destination ATTACH PARTITION ID '3-6' FROM source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (3, 6) from source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, it is a local operation, no different than regular attach. Replicated to replicated. 
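(Editor's aside, illustrative only, not part of the patch: for ReplicatedMergeTree the cloned part is, to my understanding, committed locally and then propagated to the other replicas through the replication log, so immediately after the ATTACH the destination replica already exposes the new part. A sketch of how that could be inspected, assuming the `destination` table from the test below:)

SELECT name, partition_id FROM system.parts
WHERE table = 'destination' AND database = currentDatabase() AND active;
SELECT total_replicas, active_replicas FROM system.replicas
WHERE table = 'destination' AND database = currentDatabase();
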
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE + source(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/source_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMMDD(timestamp) + ORDER BY tuple(); + +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, it is a local operation, no different than regular attach. Non replicated to replicated +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source(timestamp DateTime) ENGINE = MergeTree() PARTITION BY toYYYYMMDD(timestamp) ORDER BY tuple(); + +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_non_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-03 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION '201003' from source; -- { serverError 248 } + +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); + +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 2); + +ALTER TABLE destination 
ATTACH PARTITION ID '0' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION 0 FROM source; -- { serverError 248 } + +-- Should not be allowed because dst partition exp takes more than two arguments, so it's not considered monotonically inc +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY substring(category, 1, 2); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } + +-- Should not be allowed because dst partition exp depends on a different set of columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(productName); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } + +-- Should not be allowed because dst partition exp is not monotonically increasing +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY left(productName, 2); +CREATE TABLE destination (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(productName); + +INSERT INTO TABLE source VALUES ('bread'), ('mop'); +INSERT INTO TABLE source VALUES ('broccoli'); + +ALTER TABLE destination ATTACH PARTITION ID '4589453b7ee96ce9de1265bd57674496' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'br' from source; -- { serverError 36 } + +-- Empty/ non-existent partition, same partition expression. Nothing should happen +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Empty/ non-existent partition, different partition expression. 
Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Replace instead of attach. Empty/ non-existent partition, same partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination REPLACE PARTITION '1' FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Replace instead of attach. Empty/ non-existent partition to non-empty partition, same partition id. +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +CREATE TABLE destination (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; + +INSERT INTO TABLE destination VALUES (1); + +ALTER TABLE destination REPLACE PARTITION '1' FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; From 5179891aef9792366d948efd9f1a2454dfe8da69 Mon Sep 17 00:00:00 2001 From: Arthur Passos Date: Tue, 23 Jan 2024 11:43:08 -0300 Subject: [PATCH 089/245] remove static log --- src/Storages/MergeTree/MergeTreeDataPartCloner.cpp | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp index 78cb9aa0624..e384e1b7066 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp @@ -13,8 +13,6 @@ namespace ErrorCodes extern const int BAD_ARGUMENTS; } -static Poco::Logger * log = &Poco::Logger::get("MergeTreeDataPartCloner"); - namespace DistinctPartitionExpression { std::unique_ptr updatePartitionFile( @@ -182,7 +180,7 @@ std::pair cloneSourcePart( } LOG_DEBUG( - log, + &Poco::Logger::get("MergeTreeDataPartCloner"), "Clone {} part {} to {}{}", src_flushed_tmp_part ? 
"flushed" : "", src_part_storage->getFullPath(), From 7e86c0e9280bb6e46183c2c358474bfd283e2554 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Tue, 23 Jan 2024 23:03:15 +0800 Subject: [PATCH 090/245] Compress state of dashboard --- programs/server/dashboard.html | 6 +++--- programs/server/js/lz-string.js | 1 + src/Server/WebUIRequestHandler.cpp | 9 +++++++++ 3 files changed, 13 insertions(+), 3 deletions(-) create mode 100644 programs/server/js/lz-string.js diff --git a/programs/server/dashboard.html b/programs/server/dashboard.html index 04fdfb2d3ca..1f32048da79 100644 --- a/programs/server/dashboard.html +++ b/programs/server/dashboard.html @@ -5,6 +5,7 @@ ClickHouse Dashboard +